add command-r graph estimate

This commit is contained in:
Michael Yang 2024-04-04 13:24:20 -07:00
parent 483b81a863
commit 01f77ae25d

View file

@@ -327,7 +327,7 @@ func (llm GGML) GraphSize(context, batch int) (int64, bool) {
}
switch llm.KV().Architecture() {
-case "gemma":
+case "gemma", "command-r":
return 4 * int64(batch) * int64(embeddingLength+uint64(vocabLength)), true
case "phi2":
return max(