Update n_batch for server
This commit is contained in:
parent
cc706fb944
commit
3cab3ef4cb
1 changed file with 1 addition and 1 deletion
|
@ -28,7 +28,7 @@ from sse_starlette.sse import EventSourceResponse
|
|||
class Settings(BaseSettings):
|
||||
model: str
|
||||
n_ctx: int = 2048
|
||||
n_batch: int = 8
|
||||
n_batch: int = 512
|
||||
n_threads: int = max((os.cpu_count() or 2) // 2, 1)
|
||||
f16_kv: bool = True
|
||||
use_mlock: bool = False # This causes a silent failure on platforms that don't support mlock (e.g. Windows) took forever to figure out...
|
||||
|
|
Loading…
Reference in a new issue