2024-05-31 20:00:49 -07:00
|
|
|
package convert
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
|
|
|
"encoding/binary"
|
|
|
|
"encoding/json"
|
2024-08-27 17:54:04 -07:00
|
|
|
"errors"
|
2024-05-31 20:00:49 -07:00
|
|
|
"fmt"
|
|
|
|
"io"
|
2024-06-29 16:53:59 -07:00
|
|
|
"io/fs"
|
2024-05-31 20:00:49 -07:00
|
|
|
"slices"
|
2024-06-28 13:27:05 -07:00
|
|
|
"strings"
|
2024-05-31 20:00:49 -07:00
|
|
|
|
|
|
|
"github.com/d4l3k/go-bfloat16"
|
|
|
|
"github.com/x448/float16"
|
|
|
|
"golang.org/x/exp/maps"
|
|
|
|
)
|
|
|
|
|
|
|
|
type safetensorMetadata struct {
|
|
|
|
Type string `json:"dtype"`
|
|
|
|
Shape []uint64 `json:"shape"`
|
|
|
|
Offsets []int64 `json:"data_offsets"`
|
|
|
|
}
|
|
|
|
|
2024-06-28 13:27:05 -07:00
|
|
|
func parseSafetensors(fsys fs.FS, replacer *strings.Replacer, ps ...string) ([]Tensor, error) {
|
2024-05-31 20:00:49 -07:00
|
|
|
var ts []Tensor
|
|
|
|
for _, p := range ps {
|
2024-06-29 16:53:59 -07:00
|
|
|
f, err := fsys.Open(p)
|
2024-05-31 20:00:49 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer f.Close()
|
|
|
|
|
|
|
|
var n int64
|
|
|
|
if err := binary.Read(f, binary.LittleEndian, &n); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
b := bytes.NewBuffer(make([]byte, 0, n))
|
|
|
|
if _, err = io.CopyN(b, f, n); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
var headers map[string]safetensorMetadata
|
|
|
|
if err := json.NewDecoder(b).Decode(&headers); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
keys := maps.Keys(headers)
|
|
|
|
slices.Sort(keys)
|
|
|
|
|
2024-09-05 17:02:28 -07:00
|
|
|
names := make(map[string]struct{}, len(keys))
|
|
|
|
|
2024-05-31 20:00:49 -07:00
|
|
|
for _, key := range keys {
|
|
|
|
if value := headers[key]; value.Type != "" {
|
2024-08-27 17:54:04 -07:00
|
|
|
// bitsandbytes quantized models are unsupported
|
|
|
|
if len(value.Shape) == 0 {
|
|
|
|
return nil, errors.New("unsupported safetensors model")
|
|
|
|
}
|
2024-09-05 17:02:28 -07:00
|
|
|
ggufName := replacer.Replace(key)
|
|
|
|
if _, ok := names[ggufName]; ok {
|
|
|
|
return nil, fmt.Errorf("duplicate tensor name '%s' was found for this model", ggufName)
|
|
|
|
}
|
|
|
|
names[ggufName] = struct{}{}
|
2024-05-31 20:00:49 -07:00
|
|
|
ts = append(ts, safetensor{
|
2024-06-29 16:53:59 -07:00
|
|
|
fs: fsys,
|
2024-05-31 20:00:49 -07:00
|
|
|
path: p,
|
|
|
|
dtype: value.Type,
|
|
|
|
offset: safetensorsPad(n, value.Offsets[0]),
|
|
|
|
size: safetensorsPad(n, value.Offsets[1]) - safetensorsPad(n, value.Offsets[0]),
|
|
|
|
tensorBase: &tensorBase{
|
2024-09-05 17:02:28 -07:00
|
|
|
name: ggufName,
|
2024-05-31 20:00:49 -07:00
|
|
|
shape: value.Shape,
|
|
|
|
},
|
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return ts, nil
|
|
|
|
}
|
|
|
|
|
2024-07-08 16:59:48 -07:00
|
|
|
// safetensorsPad returns the padded size of the safetensors file given a length n and offset s
|
2024-07-31 10:58:22 -07:00
|
|
|
func safetensorsPad(n, offset int64) int64 {
|
|
|
|
return 8 + n + offset
|
2024-05-31 20:00:49 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
type safetensor struct {
|
2024-06-29 16:53:59 -07:00
|
|
|
fs fs.FS
|
2024-05-31 20:00:49 -07:00
|
|
|
path string
|
|
|
|
dtype string
|
|
|
|
offset int64
|
|
|
|
size int64
|
|
|
|
*tensorBase
|
|
|
|
}
|
|
|
|
|
|
|
|
func (st safetensor) WriteTo(w io.Writer) (int64, error) {
|
2024-06-29 16:53:59 -07:00
|
|
|
f, err := st.fs.Open(st.path)
|
2024-05-31 20:00:49 -07:00
|
|
|
if err != nil {
|
|
|
|
return 0, err
|
|
|
|
}
|
|
|
|
defer f.Close()
|
|
|
|
|
2024-06-29 16:53:59 -07:00
|
|
|
if seeker, ok := f.(io.Seeker); ok {
|
|
|
|
if _, err := seeker.Seek(st.offset, io.SeekStart); err != nil {
|
|
|
|
return 0, err
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if _, err := io.CopyN(io.Discard, f, st.offset); err != nil {
|
|
|
|
return 0, err
|
|
|
|
}
|
2024-05-31 20:00:49 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
var f32s []float32
|
|
|
|
switch st.dtype {
|
|
|
|
case "F32":
|
|
|
|
f32s = make([]float32, st.size/4)
|
|
|
|
if err = binary.Read(f, binary.LittleEndian, f32s); err != nil {
|
|
|
|
return 0, err
|
|
|
|
}
|
|
|
|
case "F16":
|
|
|
|
u16s := make([]uint16, st.size/2)
|
|
|
|
if err = binary.Read(f, binary.LittleEndian, u16s); err != nil {
|
|
|
|
return 0, err
|
|
|
|
}
|
|
|
|
|
2024-08-01 14:52:15 -07:00
|
|
|
f32s = make([]float32, len(u16s))
|
|
|
|
for i := range u16s {
|
|
|
|
f32s[i] = float16.Frombits(u16s[i]).Float32()
|
2024-05-31 20:00:49 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
case "BF16":
|
|
|
|
u8s := make([]uint8, st.size)
|
|
|
|
if err = binary.Read(f, binary.LittleEndian, u8s); err != nil {
|
|
|
|
return 0, err
|
|
|
|
}
|
|
|
|
|
|
|
|
f32s = bfloat16.DecodeFloat32(u8s)
|
|
|
|
default:
|
|
|
|
return 0, fmt.Errorf("unknown data type: %s", st.dtype)
|
|
|
|
}
|
|
|
|
|
|
|
|
if st.repacker != nil {
|
|
|
|
f32s, err = st.repacker(st.Name(), f32s, st.Shape())
|
|
|
|
if err != nil {
|
|
|
|
return 0, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
switch st.Kind() {
|
2024-07-08 16:59:48 -07:00
|
|
|
case tensorKindF32:
|
2024-05-31 20:00:49 -07:00
|
|
|
return 0, binary.Write(w, binary.LittleEndian, f32s)
|
2024-07-08 16:59:48 -07:00
|
|
|
case tensorKindF16:
|
2024-05-31 20:00:49 -07:00
|
|
|
f16s := make([]uint16, len(f32s))
|
|
|
|
for i := range f32s {
|
|
|
|
f16s[i] = float16.Fromfloat32(f32s[i]).Bits()
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0, binary.Write(w, binary.LittleEndian, f16s)
|
|
|
|
default:
|
|
|
|
return 0, fmt.Errorf("unknown storage type: %d", st.Kind())
|
|
|
|
}
|
|
|
|
}
|