Override numParallel only if unset.

This commit is contained in:
Richard Lyons 2024-08-18 01:43:26 +02:00
parent d29cd4c2ed
commit 0ad0e738cd

View file

@ -734,7 +734,9 @@ func pickBestFullFitByLibrary(req *LlmRequest, ggml *llm.GGML, gpus gpu.GpuInfoL
// If multiple Libraries are detected, pick the Library which loads the most layers for the model
func pickBestPartialFitByLibrary(req *LlmRequest, ggml *llm.GGML, gpus gpu.GpuInfoList, numParallel *int) gpu.GpuInfoList {
*numParallel = 1
if *numParallel <= 0 {
*numParallel = 1
}
byLibrary := gpus.ByLibrary()
if len(byLibrary) <= 1 {
return gpus