support new "longrope" attention factor

This commit is contained in:
Bruce MacDonald 2024-07-02 14:40:01 -07:00 committed by Michael Yang
parent 6ffb5cb017
commit aec77d6a05

View file

@@ -58,7 +58,7 @@ func (p *phi3) KV(t *Tokenizer) llm.KV {
switch p.RopeScaling.Type {
case "":
// no scaling
-case "su":
+case "su", "longrope":
kv["phi3.rope.scaling.attn_factor"] = float32(max(math.Sqrt(1+math.Log(scale)/math.Log(float64(p.OriginalMaxPositionEmbeddings))), 1.0))
case "yarn":
kv["phi3.rope.scaling.attn_factor"] = float32(max(0.1*math.Log(scale)+1.0, 1.0))