91b3e4d282
count each layer independently when deciding gpu offloading |
||
---|---|---|
.. | ||
ext_server | ||
generate | ||
llama.cpp@ad3a0505e3 | ||
patches | ||
dyn_ext_server.c | ||
dyn_ext_server.go | ||
dyn_ext_server.h | ||
ggla.go | ||
ggml.go | ||
gguf.go | ||
llama.go | ||
llm.go | ||
payload_common.go | ||
payload_darwin_amd64.go | ||
payload_darwin_arm64.go | ||
payload_linux.go | ||
payload_test.go | ||
payload_windows.go | ||
utils.go |