diff --git a/llama_cpp/llama.py b/llama_cpp/llama.py index 8076548..c696804 100644 --- a/llama_cpp/llama.py +++ b/llama_cpp/llama.py @@ -904,7 +904,7 @@ class Llama: ) self.context_params.yarn_orig_ctx = yarn_orig_ctx if yarn_orig_ctx != 0 else 0 self.context_params.mul_mat_q = mul_mat_q - self.context_params.f16_kv = f16_kv + # self.context_params.f16_kv = f16_kv self.context_params.logits_all = logits_all self.context_params.embedding = embedding