Set the KV cache data type to f16 by default

This commit is contained in:
Andrei Betlen 2023-04-14 22:21:19 -04:00
parent 9c8c2c37dc
commit 6e298d8fca

View file

@@ -21,7 +21,7 @@ class Llama:
n_ctx: int = 512,
n_parts: int = -1,
seed: int = 1337,
-f16_kv: bool = False,
+f16_kv: bool = True,
logits_all: bool = False,
vocab_only: bool = False,
use_mmap: bool = True,