Merge pull request #3466 from ollama/mxyng/head-kv
default head_kv to 1
This commit is contained in:
commit
4f895d633f
1 changed file with 6 additions and 6 deletions
12
llm/ggml.go
12
llm/ggml.go
|
@@ -148,15 +148,15 @@ func (kv KV) HeadCount() uint64 {
|
||||||
}
|
}
|
||||||
|
|
||||||
func (kv KV) HeadCountKV() uint64 {
|
func (kv KV) HeadCountKV() uint64 {
|
||||||
return kv.u64(fmt.Sprintf("%s.attention.head_count_kv", kv.Architecture()))
|
if headCountKV := kv.u64(fmt.Sprintf("%s.attention.head_count_kv", kv.Architecture())); headCountKV > 0 {
|
||||||
|
return headCountKV
|
||||||
|
}
|
||||||
|
|
||||||
|
return 1
|
||||||
}
|
}
|
||||||
|
|
||||||
func (kv KV) GQA() uint64 {
|
func (kv KV) GQA() uint64 {
|
||||||
if headCountKV := kv.HeadCountKV(); headCountKV > 0 {
|
return kv.HeadCount() / kv.HeadCountKV()
|
||||||
return kv.HeadCount() / headCountKV
|
|
||||||
}
|
|
||||||
|
|
||||||
return 0
|
|
||||||
}
|
}
|
||||||
|
|
||||||
func (kv KV) EmbeddingLength() uint64 {
|
func (kv KV) EmbeddingLength() uint64 {
|
||||||
|
|
Loading…
Reference in a new issue