Merge pull request #3496 from ollama/mxyng/cmd-r-graph

add command-r graph estimate
This commit is contained in:
Michael Yang 2024-04-05 12:26:21 -07:00 committed by GitHub
commit fc8e108642
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -327,7 +327,7 @@ func (llm GGML) GraphSize(context, batch int) (int64, bool) {
}
switch llm.KV().Architecture() {
-case "gemma":
+case "gemma", "command-r":
return 4 * int64(batch) * int64(embeddingLength+uint64(vocabLength)), true
case "phi2":
return max(