diff --git a/llama_cpp/server/settings.py b/llama_cpp/server/settings.py index 8989ffa..8ac8df8 100644 --- a/llama_cpp/server/settings.py +++ b/llama_cpp/server/settings.py @@ -143,10 +143,6 @@ class ModelSettings(BaseSettings): default=None, description="The model name or path to a pretrained HuggingFace tokenizer model. Same as you would pass to AutoTokenizer.from_pretrained().", ) - hf_model_repo_id: Optional[str] = Field( - default=None, - description="The HuggingFace repo_id to use to load model files from", - ) # Speculative Decoding draft_model: Optional[str] = Field( default=None,