.. | ||
0001-add-detokenize-endpoint.patch | ||
0001-copy-cuda-runtime-libraries.patch | ||
0001-metal-handle-ggml_scale-for-n-4-0-close-3754.patch | ||
0001-update-default-log-target.patch | ||
0002-34B-model-support.patch | ||
0003-metal-fix-synchronization-in-new-matrix-multiplicati.patch | ||
0004-metal-add-missing-barriers-for-mul-mat-2699.patch | ||
0005-ggml-support-CUDA-s-half-type-for-aarch64-1455-2670.patch |