5#include <unordered_set>
12#define DEFINE_VMAP() \
13 virtual std::pair<std::vector<array>, std::vector<int>> vmap( \
14 const std::vector<array>& inputs, const std::vector<int>& axes) \
17#define DEFINE_GRADS() \
18 std::vector<array> jvp( \
19 const std::vector<array>& primals, \
20 const std::vector<array>& tangents, \
21 const std::vector<int>& argnums) override; \
23 std::vector<array> vjp( \
24 const std::vector<array>& primals, \
25 const std::vector<array>& cotangents, \
26 const std::vector<int>& argnums, \
27 const std::vector<array>& outputs) override;
29#define DEFINE_PRINT(PRIMITIVE) \
30 void print(std::ostream& os) override { \
34#define DEFINE_DEFAULT_IS_EQUIVALENT() \
35 bool is_equivalent(const Primitive& other) const override { \
39#define DEFINE_INPUT_OUTPUT_SHAPE() \
40 std::vector<std::vector<int>> output_shapes( \
41 const std::vector<array>& inputs) override { \
42 return {inputs[0].shape()}; \
70 const std::vector<array>& inputs,
71 std::vector<array>& outputs) = 0;
73 const std::vector<array>& inputs,
74 std::vector<array>& outputs) = 0;
79 virtual std::vector<array>
jvp(
80 const std::vector<array>& primals,
81 const std::vector<array>& tangents,
82 const std::vector<int>& argnums);
87 virtual std::vector<array>
vjp(
88 const std::vector<array>& primals,
89 const std::vector<array>& cotangents,
90 const std::vector<int>& argnums,
91 const std::vector<array>& outputs);
99 virtual std::pair<std::vector<array>, std::vector<int>>
vmap(
100 const std::vector<array>& inputs,
101 const std::vector<int>& axes);
104 virtual void print(std::ostream& os) = 0;
114 const std::vector<array>& inputs);
138 const std::vector<array>& inputs,
139 std::vector<array>& outputs)
override {
143 const std::vector<array>& inputs,
144 std::vector<array>& outputs)
override {
169 void eval(const std::vector<
array>& inputs,
array& out);
186 void eval(const std::vector<
array>& inputs,
array& out);
198 const std::vector<array>& primals,
199 const std::vector<array>& cotangents,
200 const std::vector<int>& argnums,
201 const std::vector<array>& outputs)
override;
229 void eval(const std::vector<
array>& inputs,
array& out);
246 void eval(const std::vector<
array>& inputs,
array& out);
263 void eval(const std::vector<
array>& inputs,
array& out);
280 void eval(const std::vector<
array>& inputs,
array& out);
297 void eval(const std::vector<
array>& inputs,
array& out);
314 void eval(const std::vector<
array>& inputs,
array& out);
331 void eval(const std::vector<
array>& inputs,
array& out);
348 void eval(const std::vector<
array>& inputs,
array& out);
369 void eval(const std::vector<
array>& inputs,
array& out);
390 const std::vector<
array>& inputs) override;
396 void eval(const std::vector<
array>& inputs,
array& out);
415 void eval(const std::vector<
array>& inputs,
array& out);
435 void eval(const std::vector<
array>& inputs,
array& out);
442 std::vector<int> shape,
443 std::vector<size_t> strides,
446 shape_(
std::move(shape)),
447 strides_(
std::move(strides)),
458 std::vector<
int> shape_;
459 std::vector<
size_t> strides_;
462 void eval(const std::vector<
array>& inputs,
array& out);
478 void print(std::ostream& os) override;
494 const std::vector<array>& primals,
495 const std::vector<array>& cotangents,
496 const std::vector<int>& argnums,
497 const std::vector<array>& outputs)
override;
505 void eval(const std::vector<
array>& inputs,
array& out);
516 const std::vector<array>& primals,
517 const std::vector<array>& cotangents,
518 const std::vector<int>& argnums,
519 const std::vector<array>& outputs)
override;
525 void eval(const std::vector<
array>& inputs,
array& out);
542 std::vector<
int> shape_;
544 void eval(const std::vector<
array>& inputs,
array& out);
561 void eval(const std::vector<
array>& inputs,
array& out);
577 std::vector<array> inputs,
578 std::vector<array> outputs,
579 std::vector<array> tape,
580 std::unordered_set<uintptr_t> constant_ids);
582 void eval_cpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
584 void eval_gpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
590 const std::vector<
array>& inputs) override;
591 void print(std::ostream& os) override;
594 std::
string lib_name()
const {
599 const std::vector<array> inputs_;
600 const std::vector<array> outputs_;
601 const std::vector<array> tape_;
602 const std::unordered_set<uintptr_t> constant_ids_;
604 std::string kernel_lib_;
618 bool is_equivalent(const
Primitive& other) const override;
623 void eval(const std::vector<
array>& inputs,
array& out);
639 void eval(const std::vector<
array>& inputs,
array& out);
646 const std::vector<int>& kernel_strides,
647 const std::vector<int>& padding,
648 const std::vector<int>& kernel_dilation,
649 const std::vector<int>& input_dilation,
650 const int groups = 1,
651 const bool flip =
false)
654 kernel_strides_(kernel_strides),
655 kernel_dilation_(kernel_dilation),
656 input_dilation_(input_dilation),
664 const std::vector<array>& primals,
665 const std::vector<array>& cotangents,
666 const std::vector<int>& argnums,
667 const std::vector<array>& outputs)
override;
670 bool is_equivalent(const
Primitive& other) const override;
673 std::vector<
int> padding_;
674 std::vector<
int> kernel_strides_;
675 std::vector<
int> kernel_dilation_;
676 std::vector<
int> input_dilation_;
680 void eval(const std::vector<
array>& inputs,
array& out);
697 void eval(const std::vector<
array>& inputs,
array& out);
714 void eval(const std::vector<
array>& inputs,
array& out);
731 void eval(const std::vector<
array>& inputs,
array& out);
739 std::function<std::vector<array>(
740 const std::vector<array>&,
741 const std::vector<array>&,
742 const std::vector<array>&)> vjp,
743 std::function<std::vector<array>(
744 const std::vector<array>&,
745 const std::vector<array>&,
746 const std::vector<int>&)> jvp,
747 std::function<std::pair<std::vector<array>, std::vector<int>>(
748 const std::vector<array>&,
749 const std::vector<int>&)> vmap)
751 num_outputs_(num_outputs),
756 void eval_cpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
758 void eval_gpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
766 void eval(
const std::vector<array>& inputs, std::vector<array>& outputs);
770 std::function<std::vector<array>(
771 const std::vector<array>&,
772 const std::vector<array>&,
773 const std::vector<array>&)>
775 std::function<std::vector<array>(
776 const std::vector<array>&,
777 const std::vector<array>&,
778 const std::vector<int>&)>
780 std::function<std::pair<std::vector<array>, std::vector<int>>(
781 const std::vector<array>&,
782 const std::vector<int>&)>
790 void eval_cpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
792 void eval_gpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
796 const std::vector<array>& primals,
797 const std::vector<array>& cotan,
798 const std::vector<int>& argnums,
799 const std::vector<array>& outputs)
override;
804 void eval(
const std::vector<array>& inputs, std::vector<array>& outputs);
821 void eval(const std::vector<
array>& inputs,
array& out);
828 void eval_cpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
830 void eval_gpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
837 std::vector<std::vector<
int>> output_shapes(
838 const std::vector<
array>& inputs)
override {
839 return std::vector{inputs[0].shape(), inputs[0].shape()};
843 void eval(
const std::vector<array>& inputs, std::vector<array>& outputs);
860 void eval(const std::vector<
array>& inputs,
array& out);
877 void eval(const std::vector<
array>& inputs,
array& out);
893 void print(std::ostream& os)
override {
902 void eval(
const std::vector<array>& inputs,
array& out);
920 void eval(const std::vector<
array>& inputs,
array& out);
937 void eval(const std::vector<
array>& inputs,
array& out);
954 void eval(const std::vector<
array>& inputs,
array& out);
970 void eval(const std::vector<
array>& inputs,
array& out);
977 const std::vector<size_t>& axes,
989 bool is_equivalent(const
Primitive& other) const override;
992 std::vector<
size_t> axes_;
996 void eval(const std::vector<
array>& inputs,
array& out);
1013 void eval(const std::vector<
array>& inputs,
array& out);
1029 void eval(const std::vector<
array>& inputs,
array& out);
1036 const std::vector<int>& axes,
1037 const std::vector<int>& slice_sizes)
1038 :
UnaryPrimitive(stream), axes_(axes), slice_sizes_(slice_sizes) {}
1049 void eval(const std::vector<
array>& inputs,
array& out);
1050 std::vector<
int> axes_;
1051 std::vector<
int> slice_sizes_;
1068 void eval(const std::vector<
array>& inputs,
array& out);
1085 void eval(const std::vector<
array>& inputs,
array& out);
1106 void eval(const std::vector<
array>& inputs,
array& out);
1137 void eval(const std::vector<
array>& inputs,
array& out);
1154 void eval(const std::vector<
array>& inputs,
array& out);
1161 std::shared_ptr<io::Reader> reader,
1163 bool swap_endianness =
false)
1165 reader_(
std::move(reader)),
1167 swap_endianness_(swap_endianness) {
1168 if (stream.
device == Device::gpu) {
1180 static Stream io_stream = new_stream(Device::cpu);
1183 void eval(
const std::vector<array>& inputs,
array& out);
1184 std::shared_ptr<io::Reader> reader_;
1186 bool swap_endianness_;
1204 void print(std::ostream& os)
override {
1220 void eval(
const std::vector<array>& inputs,
array& out);
1236 void eval(const std::vector<
array>& inputs,
array& out);
1253 void eval(const std::vector<
array>& inputs,
array& out);
1270 void eval(const std::vector<
array>& inputs,
array& out);
1287 void eval(const std::vector<
array>& inputs,
array& out);
1304 void eval(const std::vector<
array>& inputs,
array& out);
1315 const std::vector<array>& primals,
1316 const std::vector<array>& cotangents,
1317 const std::vector<int>& argnums,
1318 const std::vector<array>& outputs)
override;
1339 void eval(const std::vector<
array>& inputs,
array& out);
1356 void eval(const std::vector<
array>& inputs,
array& out);
1373 void eval(const std::vector<
array>& inputs,
array& out);
1390 void eval(const std::vector<
array>& inputs,
array& out);
1407 void eval(const std::vector<
array>& inputs,
array& out);
1414 std::vector<int> axes,
1418 axes_(
std::move(axes)),
1419 inverted_(inverted),
1428 std::vector<std::vector<
int>> output_shapes(
1429 const std::vector<
array>& inputs)
override {
1434 std::vector<int> axes_;
1438 void eval(
const std::vector<array>& inputs,
array& out);
1445 const std::vector<int>& axes,
1446 const std::vector<int>& low_pad_size,
1447 const std::vector<int>& high_pad_size)
1450 low_pad_size_(low_pad_size),
1451 high_pad_size_(high_pad_size) {}
1462 std::vector<
int> axes_;
1463 std::vector<
int> low_pad_size_;
1464 std::vector<
int> high_pad_size_;
1466 void eval(const std::vector<
array>& inputs,
array& out);
1487 void eval(const std::vector<
array>& inputs,
array& out);
1504 void eval(const std::vector<
array>& inputs,
array& out);
1515 group_size_(group_size),
1532 void eval(const std::vector<
array>& inputs,
array& out);
1539 group_size_(group_size),
1556 void eval(const std::vector<
array>& inputs,
array& out);
1572 std::vector<
int> shape_;
1575 void eval(const std::vector<
array>& inputs,
array& out);
1606 std::vector<
int> shape_;
1608 void eval(const std::vector<
array>& inputs,
array& out);
1610 std::pair<
bool, std::vector<
size_t>> prepare_reshape(
1613 void shared_buffer_reshape(
1615 const std::vector<
size_t>& out_strides,
1626 const std::vector<int>& axes)
1627 :
UnaryPrimitive(stream), reduce_type_(reduce_type), axes_(axes) {}
1635 const std::vector<
array>& primals,
1636 const std::vector<
array>& cotangents,
1637 const std::vector<
int>& argnums,
1638 const std::vector<
array>& outputs) override;
1640 std::vector<std::vector<
int>> output_shapes(
1641 const std::vector<
array>& inputs) override;
1643 void print(std::ostream& os)
override {
1644 switch (reduce_type_) {
1669 std::vector<int> axes_;
1671 void eval(
const std::vector<array>& inputs,
array& out);
1688 void eval(const std::vector<
array>& inputs,
array& out);
1702 reduce_type_(reduce_type),
1705 inclusive_(inclusive) {}
1713 void print(std::ostream& os)
override {
1715 switch (reduce_type_) {
1738 void eval(
const std::vector<array>& inputs,
array& out);
1748 const std::vector<int>& axes)
1749 :
UnaryPrimitive(stream), reduce_type_(reduce_type), axes_(axes) {}
1759 switch (reduce_type_) {
1779 void eval(
const std::vector<array>& inputs,
array& out);
1781 std::vector<int> axes_;
1798 void eval(const std::vector<
array>& inputs,
array& out);
1815 void eval(const std::vector<
array>& inputs,
array& out);
1832 void eval(const std::vector<
array>& inputs,
array& out);
1849 void eval(const std::vector<
array>& inputs,
array& out);
1856 const std::vector<int>& start_indices,
1857 const std::vector<int>& end_indices,
1858 const std::vector<int>& strides)
1860 start_indices_(start_indices),
1861 end_indices_(end_indices),
1862 strides_(strides) {}
1873 std::vector<
int> start_indices_;
1874 std::vector<
int> end_indices_;
1875 std::vector<
int> strides_;
1877 void eval(const std::vector<
array>& inputs,
array& out);
1884 const std::vector<int>& start_indices,
1885 const std::vector<int>& end_indices,
1886 const std::vector<int>& strides)
1888 start_indices_(start_indices),
1889 end_indices_(end_indices),
1890 strides_(strides) {}
1901 std::vector<
int> start_indices_;
1902 std::vector<
int> end_indices_;
1903 std::vector<
int> strides_;
1905 void eval(const std::vector<
array>& inputs,
array& out);
1907 std::tuple<int64_t, std::vector<int64_t>> prepare_slice(const
array& in);
1926 void eval(const std::vector<
array>& inputs,
array& out);
1947 void eval(const std::vector<
array>& inputs,
array& out);
1952 explicit Split(
Stream stream,
const std::vector<int>& indices,
int axis)
1953 :
Primitive(stream), indices_(indices), axis_(axis) {}
1955 void eval_cpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
1957 void eval_gpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
1966 void eval(const std::vector<
array>& inputs, std::vector<
array>& outputs);
1968 std::vector<
int> indices_;
1986 void eval(const std::vector<
array>& inputs,
array& out);
2002 void print(std::ostream& os)
override {
2011 void eval(
const std::vector<array>& inputs,
array& out);
2028 void eval(const std::vector<
array>& inputs,
array& out);
2045 void eval(const std::vector<
array>& inputs,
array& out);
2062 void eval(const std::vector<
array>& inputs,
array& out);
2079 void eval(const std::vector<
array>& inputs,
array& out);
2094 void eval(const std::vector<
array>& inputs,
array& out);
2106 void print(std::ostream& os) override;
2127 std::vector<
int> axes_;
2129 void eval(const std::vector<
array>& inputs,
array& out);
2137 void eval_cpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
2139 void eval_gpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
2145 void eval(
const std::vector<array>& inputs, std::vector<array>& outputs);
2153 void eval_cpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
2155 void eval_gpu(
const std::vector<array>& inputs, std::vector<array>& outputs)
2162 void eval(const std::vector<
array>& inputs, std::vector<
array>& outputs);
2178 void eval(const std::vector<
array>& inputs,
array& output);
2195 void eval(const std::vector<
array>& inputs,
array& output);
Definition primitives.h:155
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Abs(Stream stream)
Definition primitives.h:157
void print(std::ostream &os) override
Print the primitive.
Definition primitives.h:164
std::vector< std::vector< int > > output_shapes(const std::vector< array > &inputs) override
Get the output shapes of the primitive.
Definition primitives.h:166
bool is_equivalent(const Primitive &other) const override
Equivalence check defaults to false unless overridden by the primitive.
Definition primitives.h:165
Definition primitives.h:172
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Add(Stream stream)
Definition primitives.h:174
Definition primitives.h:189
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
AddMM(Stream stream, float alpha, float beta)
Definition primitives.h:191
std::vector< array > vjp(const std::vector< array > &primals, const std::vector< array > &cotangents, const std::vector< int > &argnums, const std::vector< array > &outputs) override
The vector-Jacobian product.
Definition primitives.h:213
Arange(Stream stream, double start, double stop, double step)
Definition primitives.h:215
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:232
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
ArcCos(Stream stream)
Definition primitives.h:234
Definition primitives.h:249
void eval_cpu(const std::vector< array > &inputs, array &out) override
ArcCosh(Stream stream)
Definition primitives.h:251
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:266
void eval_gpu(const std::vector< array > &inputs, array &out) override
ArcSin(Stream stream)
Definition primitives.h:268
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:283
ArcSinh(Stream stream)
Definition primitives.h:285
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:317
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
ArcTan2(Stream stream)
Definition primitives.h:319
Definition primitives.h:300
void eval_cpu(const std::vector< array > &inputs, array &out) override
ArcTan(Stream stream)
Definition primitives.h:302
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:334
void eval_gpu(const std::vector< array > &inputs, array &out) override
ArcTanh(Stream stream)
Definition primitives.h:336
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:351
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
ArgPartition(Stream stream, int kth, int axis)
Definition primitives.h:353
Definition primitives.h:372
ReduceType
Definition primitives.h:374
@ ArgMin
Definition primitives.h:375
@ ArgMax
Definition primitives.h:376
ArgReduce(Stream stream, ReduceType reduce_type, int axis)
Definition primitives.h:379
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:399
void eval_cpu(const std::vector< array > &inputs, array &out) override
ArgSort(Stream stream, int axis)
Definition primitives.h:401
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:438
AsStrided(Stream stream, std::vector< int > shape, std::vector< size_t > strides, size_t offset)
Definition primitives.h:440
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:418
void eval_gpu(const std::vector< array > &inputs, array &out) override
AsType(Stream stream, Dtype dtype)
Definition primitives.h:420
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:465
BitwiseBinary(Stream stream, Op op)
Definition primitives.h:469
void eval_cpu(const std::vector< array > &inputs, array &out) override
Op
Definition primitives.h:467
@ And
Definition primitives.h:467
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:485
std::vector< array > vjp(const std::vector< array > &primals, const std::vector< array > &cotangents, const std::vector< int > &argnums, const std::vector< array > &outputs) override
The vector-Jacobian product.
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
BlockMaskedMM(Stream stream, int block_size)
Definition primitives.h:487
Definition primitives.h:528
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Broadcast(Stream stream, const std::vector< int > &shape)
Definition primitives.h:530
Definition primitives.h:547
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Ceil(Stream stream)
Definition primitives.h:549
Definition primitives.h:2183
void eval_cpu(const std::vector< array > &inputs, array &out) override
Cholesky(Stream stream, bool upper)
Definition primitives.h:2185
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:564
Compiled(Stream stream, std::vector< array > inputs, std::vector< array > outputs, std::vector< array > tape, std::unordered_set< uintptr_t > constant_ids)
void eval_gpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
void eval_cpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
A primitive must know how to evaluate itself on the CPU/GPU for the given inputs and populate the out...
Definition primitives.h:607
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Concatenate(Stream stream, int axis)
Definition primitives.h:609
Definition primitives.h:626
Conjugate(Stream stream)
Definition primitives.h:628
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:642
void eval_gpu(const std::vector< array > &inputs, array &out) override
Convolution(Stream stream, const std::vector< int > &kernel_strides, const std::vector< int > &padding, const std::vector< int > &kernel_dilation, const std::vector< int > &input_dilation, const int groups=1, const bool flip=false)
Definition primitives.h:644
void eval_cpu(const std::vector< array > &inputs, array &out) override
std::vector< array > vjp(const std::vector< array > &primals, const std::vector< array > &cotangents, const std::vector< int > &argnums, const std::vector< array > &outputs) override
The vector-Jacobian product.
Definition primitives.h:683
void eval_gpu(const std::vector< array > &inputs, array &out) override
Copy(Stream stream)
Definition primitives.h:685
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:700
void eval_cpu(const std::vector< array > &inputs, array &out) override
Cos(Stream stream)
Definition primitives.h:702
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:717
void eval_gpu(const std::vector< array > &inputs, array &out) override
Cosh(Stream stream)
Definition primitives.h:719
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:786
std::vector< array > vjp(const std::vector< array > &primals, const std::vector< array > &cotan, const std::vector< int > &argnums, const std::vector< array > &outputs) override
The vector-Jacobian product.
void eval_cpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
A primitive must know how to evaluate itself on the CPU/GPU for the given inputs and populate the out...
Depends(Stream stream)
Definition primitives.h:788
void eval_gpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
Definition primitives.h:824
void eval_gpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
DivMod(Stream stream)
Definition primitives.h:826
void eval_cpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
A primitive must know how to evaluate itself on the CPU/GPU for the given inputs and populate the out...
Definition primitives.h:807
Divide(Stream stream)
Definition primitives.h:809
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:880
Equal(Stream stream, bool equal_nan=false)
Definition primitives.h:882
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:906
Erf(Stream stream)
Definition primitives.h:908
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:923
void eval_gpu(const std::vector< array > &inputs, array &out) override
ErfInv(Stream stream)
Definition primitives.h:925
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:940
Exp(Stream stream)
Definition primitives.h:942
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:957
Expm1(Stream stream)
Definition primitives.h:959
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:973
FFT(Stream stream, const std::vector< size_t > &axes, bool inverse, bool real)
Definition primitives.h:975
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:999
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Floor(Stream stream)
Definition primitives.h:1001
Definition primitives.h:1016
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Full(Stream stream)
Definition primitives.h:1018
Definition primitives.h:1032
Gather(Stream stream, const std::vector< int > &axes, const std::vector< int > &slice_sizes)
Definition primitives.h:1034
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:508
void eval_cpu(const std::vector< array > &inputs, array &out) override
std::vector< array > vjp(const std::vector< array > &primals, const std::vector< array > &cotangents, const std::vector< int > &argnums, const std::vector< array > &outputs) override
The vector-Jacobian product.
void eval_gpu(const std::vector< array > &inputs, array &out) override
GatherMM(Stream stream)
Definition primitives.h:510
Definition primitives.h:1535
GatherQMM(Stream stream, int group_size, int bits, bool transpose)
Definition primitives.h:1537
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1071
void eval_cpu(const std::vector< array > &inputs, array &out) override
GreaterEqual(Stream stream)
Definition primitives.h:1073
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1054
Greater(Stream stream)
Definition primitives.h:1056
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1088
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Hadamard(Stream stream, float scale)
Definition primitives.h:1090
Definition primitives.h:1109
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Imag(Stream stream)
Definition primitives.h:1111
Definition primitives.h:2166
void eval_gpu(const std::vector< array > &inputs, array &output) override
Inverse(Stream stream, bool tri, bool upper)
Definition primitives.h:2168
void eval_cpu(const std::vector< array > &inputs, array &output) override
Definition primitives.h:1140
LessEqual(Stream stream)
Definition primitives.h:1142
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1123
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Less(Stream stream)
Definition primitives.h:1125
Definition primitives.h:1157
void eval_gpu(const std::vector< array > &inputs, array &out) override
Load(Stream stream, std::shared_ptr< io::Reader > reader, size_t offset, bool swap_endianness=false)
Definition primitives.h:1159
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1223
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Log1p(Stream stream)
Definition primitives.h:1225
Definition primitives.h:1290
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
LogAddExp(Stream stream)
Definition primitives.h:1292
Definition primitives.h:1189
Base
Definition primitives.h:1191
Log(Stream stream, Base base)
Definition primitives.h:1193
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1256
void eval_gpu(const std::vector< array > &inputs, array &out) override
LogicalAnd(Stream stream)
Definition primitives.h:1258
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1239
void eval_gpu(const std::vector< array > &inputs, array &out) override
LogicalNot(Stream stream)
Definition primitives.h:1241
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1273
void eval_cpu(const std::vector< array > &inputs, array &out) override
LogicalOr(Stream stream)
Definition primitives.h:1275
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1307
void eval_cpu(const std::vector< array > &inputs, array &out) override
std::vector< array > vjp(const std::vector< array > &primals, const std::vector< array > &cotangents, const std::vector< int > &argnums, const std::vector< array > &outputs) override
The vector-Jacobian product.
void eval_gpu(const std::vector< array > &inputs, array &out) override
Matmul(Stream stream)
Definition primitives.h:1309
Definition primitives.h:1325
Maximum(Stream stream)
Definition primitives.h:1327
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1342
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Minimum(Stream stream)
Definition primitives.h:1344
Definition primitives.h:1359
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Multiply(Stream stream)
Definition primitives.h:1361
Definition primitives.h:1376
void eval_gpu(const std::vector< array > &inputs, array &out) override
Negative(Stream stream)
Definition primitives.h:1378
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1393
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
NotEqual(Stream stream)
Definition primitives.h:1395
Definition primitives.h:1410
void eval_gpu(const std::vector< array > &inputs, array &out) override
NumberOfElements(Stream stream, std::vector< int > axes, bool inverted, Dtype dtype)
Definition primitives.h:1412
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1441
void eval_cpu(const std::vector< array > &inputs, array &out) override
Pad(Stream stream, const std::vector< int > &axes, const std::vector< int > &low_pad_size, const std::vector< int > &high_pad_size)
Definition primitives.h:1443
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1469
void eval_cpu(const std::vector< array > &inputs, array &out) override
Partition(Stream stream, int kth, int axis)
Definition primitives.h:1471
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1490
void eval_cpu(const std::vector< array > &inputs, array &out) override
Power(Stream stream)
Definition primitives.h:1492
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:48
virtual void eval_cpu(const std::vector< array > &inputs, std::vector< array > &outputs)=0
A primitive must know how to evaluate itself on the CPU/GPU for the given inputs and populate the out...
virtual std::vector< array > vjp(const std::vector< array > &primals, const std::vector< array > &cotangents, const std::vector< int > &argnums, const std::vector< array > &outputs)
The vector-Jacobian product.
virtual ~Primitive()=default
Primitive(const Primitive &other)=delete
Primitive(Primitive &&other)=delete
const Stream & stream()
The stream the primitive will run on.
Definition primitives.h:58
Primitive & operator=(Primitive &&other)=delete
virtual bool is_equivalent(const Primitive &other) const
Equivalence check defaults to false unless overridden by the primitive.
Definition primitives.h:107
Primitive & operator=(const Primitive &other)=delete
virtual std::vector< std::vector< int > > output_shapes(const std::vector< array > &inputs)
Get the output shapes of the primitive.
const Device & device()
The device the primitive will run on.
Definition primitives.h:53
virtual std::vector< array > jvp(const std::vector< array > &primals, const std::vector< array > &tangents, const std::vector< int > &argnums)
The Jacobian-vector product.
virtual std::pair< std::vector< array >, std::vector< int > > vmap(const std::vector< array > &inputs, const std::vector< int > &axes)
The primitive must know how to vectorize itself across the given axes.
virtual void eval_gpu(const std::vector< array > &inputs, std::vector< array > &outputs)=0
virtual void print(std::ostream &os)=0
Print the primitive.
Primitive(Stream stream)
Definition primitives.h:50
Definition primitives.h:2133
QRF(Stream stream)
Definition primitives.h:2135
void eval_cpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
A primitive must know how to evaluate itself on the CPU/GPU for the given inputs and populate the out...
void eval_gpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
Definition primitives.h:1507
void eval_gpu(const std::vector< array > &inputs, array &out) override
QuantizedMatmul(Stream stream, int group_size, int bits, bool transpose)
Definition primitives.h:1509
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1559
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
RandomBits(Stream stream, const std::vector< int > &shape, int width)
Definition primitives.h:1561
Definition primitives.h:1578
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Real(Stream stream)
Definition primitives.h:1580
Definition primitives.h:1619
Reduce(Stream stream, ReduceType reduce_type, const std::vector< int > &axes)
Definition primitives.h:1623
ReduceType
Definition primitives.h:1621
@ And
Definition primitives.h:1621
bool is_equivalent(const Primitive &other) const override
Equivalence check defaults to false unless overridden by the primitive.
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:863
Remainder(Stream stream)
Definition primitives.h:865
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1592
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Reshape(Stream stream, const std::vector< int > &shape)
Definition primitives.h:1594
Definition primitives.h:1674
Round(Stream stream)
Definition primitives.h:1676
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:2149
void eval_cpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
A primitive must know how to evaluate itself on the CPU/GPU for the given inputs and populate the out...
void eval_gpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
SVD(Stream stream)
Definition primitives.h:2151
Definition primitives.h:1691
void eval_cpu(const std::vector< array > &inputs, array &out) override
ReduceType
Definition primitives.h:1693
@ Max
Definition primitives.h:1693
bool is_equivalent(const Primitive &other) const override
Equivalence check defaults to false unless overridden by the primitive.
Scan(Stream stream, ReduceType reduce_type, int axis, bool reverse, bool inclusive)
Definition primitives.h:1695
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1741
bool is_equivalent(const Primitive &other) const override
Equivalence check defaults to false unless overridden by the primitive.
ReduceType
Definition primitives.h:1743
@ Max
Definition primitives.h:1743
void eval_cpu(const std::vector< array > &inputs, array &out) override
void print(std::ostream &os) override
Print the primitive.
Definition primitives.h:1757
void eval_gpu(const std::vector< array > &inputs, array &out) override
Scatter(Stream stream, ReduceType reduce_type, const std::vector< int > &axes)
Definition primitives.h:1745
Definition primitives.h:846
void eval_gpu(const std::vector< array > &inputs, array &out) override
Select(Stream stream)
Definition primitives.h:848
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1784
Sigmoid(Stream stream)
Definition primitives.h:1786
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1801
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Sign(Stream stream)
Definition primitives.h:1803
Definition primitives.h:1818
Sin(Stream stream)
Definition primitives.h:1820
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1835
Sinh(Stream stream)
Definition primitives.h:1837
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1852
void eval_cpu(const std::vector< array > &inputs, array &out) override
Slice(Stream stream, const std::vector< int > &start_indices, const std::vector< int > &end_indices, const std::vector< int > &strides)
Definition primitives.h:1854
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1880
SliceUpdate(Stream stream, const std::vector< int > &start_indices, const std::vector< int > &end_indices, const std::vector< int > &strides)
Definition primitives.h:1882
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1910
void eval_gpu(const std::vector< array > &inputs, array &out) override
Softmax(Stream stream, bool precise)
Definition primitives.h:1912
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1930
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Sort(Stream stream, int axis)
Definition primitives.h:1932
Definition primitives.h:1950
void eval_gpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
Split(Stream stream, const std::vector< int > &indices, int axis)
Definition primitives.h:1952
void eval_cpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
A primitive must know how to evaluate itself on the CPU/GPU for the given inputs and populate the out...
Definition primitives.h:1989
void eval_cpu(const std::vector< array > &inputs, array &out) override
Sqrt(Stream stream, bool recip=false)
Definition primitives.h:1991
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:1972
void eval_gpu(const std::vector< array > &inputs, array &out) override
void eval_cpu(const std::vector< array > &inputs, array &out) override
Square(Stream stream)
Definition primitives.h:1974
Definition primitives.h:2015
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
StopGradient(Stream stream)
Definition primitives.h:2017
Definition primitives.h:2031
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Subtract(Stream stream)
Definition primitives.h:2033
Definition primitives.h:2048
Tan(Stream stream)
Definition primitives.h:2050
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:2065
void eval_gpu(const std::vector< array > &inputs, array &out) override
Tanh(Stream stream)
Definition primitives.h:2067
void eval_cpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:2113
Transpose(Stream stream, const std::vector< int > &axes)
Definition primitives.h:2115
void eval_cpu(const std::vector< array > &inputs, array &out) override
void eval_gpu(const std::vector< array > &inputs, array &out) override
Definition primitives.h:127
UnaryPrimitive & operator=(const UnaryPrimitive &other)=delete
UnaryPrimitive(Stream stream)
An abstract base class for a primitive with a single output.
Definition primitives.h:132
virtual void eval_gpu(const std::vector< array > &inputs, array &output)=0
UnaryPrimitive(UnaryPrimitive &&other)=delete
virtual void eval_cpu(const std::vector< array > &inputs, array &output)=0
void eval_gpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
Definition primitives.h:142
UnaryPrimitive(const UnaryPrimitive &other)=delete
void eval_cpu(const std::vector< array > &inputs, std::vector< array > &outputs) override
A primitive must know how to evaluate itself on the CPU/GPU for the given inputs and populate the out...
Definition primitives.h:137
UnaryPrimitive & operator=(UnaryPrimitive &&other)=delete
virtual ~UnaryPrimitive()=default
Definition primitives.h:2097
void eval_cpu(const std::vector< array > &inputs, array &out) override
View(Stream stream, Dtype dtype)
Definition primitives.h:2099
void eval_gpu(const std::vector< array > &inputs, array &out) override
Op op
Definition binary.h:129
array std(const array &a, bool keepdims, int ddof=0, StreamOrDevice s={})
Computes the standard deviation of the elements of an array.
array tri(int n, int m, int k, Dtype type, StreamOrDevice s={})
array transpose(const array &a, std::vector< int > axes, StreamOrDevice s={})
Permutes the dimensions according to the given axes.
array real(const array &a, StreamOrDevice s={})
std::pair< std::vector< array >, std::vector< array > > jvp(const std::function< std::vector< array >(const std::vector< array > &)> &fun, const std::vector< array > &primals, const std::vector< array > &tangents)
Computes the output and Jacobian-vector product (JVP) of a function.
std::pair< std::vector< array >, std::vector< array > > vjp(const std::function< std::vector< array >(const std::vector< array > &)> &fun, const std::vector< array > &primals, const std::vector< array > &cotangents)
Computes the output and vector-Jacobian product (VJP) of a function.
void eval(std::vector< array > outputs)
std::function< array(const array &)> vmap(const std::function< array(const array &)> &fun, int in_axis=0, int out_axis=0)
Automatically vectorize a unary function over the requested axes.
#define DEFINE_DEFAULT_IS_EQUIVALENT()
Definition primitives.h:34
#define DEFINE_PRINT(PRIMITIVE)
Definition primitives.h:29
#define DEFINE_INPUT_OUTPUT_SHAPE()
Definition primitives.h:39
#define DEFINE_GRADS()
Definition primitives.h:17
#define DEFINE_VMAP()
Definition primitives.h:12
Definition binary_ops.h:270
Definition binary_ops.h:277
Device device
Definition stream.h:11