fix: wrong parameter for flash attention in pickle __getstate__
This commit is contained in:
parent
22d77eefd2
commit
29b6e9a5c8
1 changed file with 1 addition and 1 deletion
|
@@ -1777,7 +1777,7 @@ class Llama:
|
||||||
logits_all=self.context_params.logits_all,
|
logits_all=self.context_params.logits_all,
|
||||||
embedding=self.context_params.embeddings,
|
embedding=self.context_params.embeddings,
|
||||||
offload_kqv=self.context_params.offload_kqv,
|
offload_kqv=self.context_params.offload_kqv,
|
||||||
flash_offload=self.context_params.flash_offload,
|
flash_attn=self.context_params.flash_attn,
|
||||||
# Sampling Params
|
# Sampling Params
|
||||||
last_n_tokens_size=self.last_n_tokens_size,
|
last_n_tokens_size=self.last_n_tokens_size,
|
||||||
# LoRA Params
|
# LoRA Params
|
||||||
|
|
Loading…
Reference in a new issue