Handle longer prompt/generation (#931)

* rebase

* nits

* nit

* fix rotating cache with step prefill

* update version
This commit is contained in:
Awni Hannun
2024-08-16 15:28:39 -07:00
committed by GitHub
parent e196fa3208
commit 7be292c0c9
32 changed files with 255 additions and 13 deletions

View File

@@ -1,3 +1,5 @@
# Copyright © 2023-2024 Apple Inc.
from dataclasses import dataclass
from typing import Any, List, Optional, Tuple, Union