Reduce a little overhead (#871)

* some small overhead improvements

* use result_type in rms_norm

* remove release force

* fix + use non-vector version

* revert compile change

* fix ops

* a little more overhead

* a little more cleanup and overhead
This commit is contained in:
Awni Hannun
2024-03-22 17:29:36 -07:00
committed by GitHub
parent 6ee1112f30
commit be98f4ab6b
13 changed files with 239 additions and 240 deletions

View File

@@ -158,9 +158,7 @@ array expand_dims(
StreamOrDevice s = {});
/**
 * Add a singleton dimension at the given axis.
 *
 * Single-axis convenience overload: wraps `axis` in a one-element
 * `std::vector<int>` and forwards it, together with `a` and `s`, to the
 * `expand_dims` overload that takes a vector of axes.
 */
inline array expand_dims(const array& a, int axis, StreamOrDevice s = {}) {
return expand_dims(a, std::vector<int>{axis}, s);
}
array expand_dims(const array& a, int axis, StreamOrDevice s = {});
/** Slice an array. */
array slice(