use a bool mask for attention (#1319)

This commit is contained in:
Awni Hannun
2025-03-04 12:47:32 -08:00
committed by GitHub
parent 1bc3476a46
commit 65aa2ec849
2 changed files with 5 additions and 6 deletions

View File

@@ -152,7 +152,7 @@ def setup_arg_parser():
"--num-draft-tokens",
type=int,
help="Number of tokens to draft when using speculative decoding.",
-default=2,
+default=3,
)
return parser