reader.go 1.47 KB
Newer Older
Michael Yang's avatar
Michael Yang committed
1
2
3
4
5
package convert

import (
	"errors"
	"io"
6
	"io/fs"
Michael Yang's avatar
Michael Yang committed
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
	"strings"
)

// Tensor describes a single tensor handled by this package: it exposes the
// tensor's metadata and can serialize the tensor to a writer.
type Tensor interface {
	// Name returns the tensor's name.
	Name() string
	// Shape returns the tensor's dimensions.
	Shape() []uint64
	// Kind returns the numeric kind code for the tensor (see the
	// tensorKind* constants).
	Kind() uint32
	// SetRepacker installs the repacker function for the tensor.
	// NOTE(review): presumably the repacker is applied when the tensor is
	// written — confirm against the concrete implementations.
	SetRepacker(repacker)
	// WriteTo writes the tensor to the given writer and returns the number
	// of bytes written and any error (same signature as io.WriterTo).
	WriteTo(io.Writer) (int64, error)
}

// tensorBase holds the metadata behind the Name, Shape, Kind and SetRepacker
// methods. It does not implement WriteTo itself.
// NOTE(review): presumably embedded by format-specific tensor types that
// supply WriteTo — confirm against the parsers.
type tensorBase struct {
	name  string   // tensor name, returned by Name and inspected by Kind
	shape []uint64 // tensor dimensions, returned by Shape; its length drives Kind
	repacker       // embedded repacker function, replaced via SetRepacker
}

// Name returns the tensor's name.
func (t tensorBase) Name() string {
	return t.name
}

// Shape returns the tensor's dimensions. The returned slice is the stored
// slice itself, not a copy, so callers share its backing array.
func (t tensorBase) Shape() []uint64 {
	return t.shape
}

Michael Yang's avatar
Michael Yang committed
32
33
34
35
36
// Tensor kind codes returned by Kind. The values come from iota, so
// tensorKindF32 is 0 and tensorKindF16 is 1.
// NOTE(review): the names suggest 32-bit and 16-bit floating point storage;
// the numeric values presumably match the output format's type IDs — confirm.
const (
	tensorKindF32 uint32 = iota
	tensorKindF16
)

Michael Yang's avatar
Michael Yang committed
37
38
39
func (t tensorBase) Kind() uint32 {
	if strings.HasSuffix(t.name, ".block_sparse_moe.gate.weight") {
		return 0
Michael Yang's avatar
bert  
Michael Yang committed
40
41
	} else if t.name == "embeddings.token_type_embeddings.weight" {
		return 0
Michael Yang's avatar
Michael Yang committed
42
43
44
45
46
47
	}

	switch len(t.shape) {
	case 0:
		panic("invalid tensor shape")
	case 1:
Michael Yang's avatar
Michael Yang committed
48
		return tensorKindF32
Michael Yang's avatar
Michael Yang committed
49
	default:
Michael Yang's avatar
Michael Yang committed
50
		return tensorKindF16
Michael Yang's avatar
Michael Yang committed
51
52
53
54
55
56
57
58
59
	}
}

// SetRepacker replaces the tensor's embedded repacker with fn. It uses a
// pointer receiver so the assignment is visible to the caller's value.
func (t *tensorBase) SetRepacker(fn repacker) {
	t.repacker = fn
}

// repacker is a function that takes a string, a []float32 and a []uint64 and
// returns a []float32 or an error.
// NOTE(review): presumably the arguments are the tensor name, its data and
// its shape, and the result is the repacked data — confirm against callers.
type repacker func(string, []float32, []uint64) ([]float32, error)

60
func parseTensors(fsys fs.FS) ([]Tensor, error) {
Michael Yang's avatar
Michael Yang committed
61
62
63
64
65
66
67
68
69
	patterns := []struct {
		Pattern string
		Func    func(fs.FS, ...string) ([]Tensor, error)
	}{
		{"model-*-of-*.safetensors", parseSafetensors},
		{"model.safetensors", parseSafetensors},
		{"pytorch_model-*-of-*.bin", parseTorch},
		{"pytorch_model.bin", parseTorch},
		{"consolidated.*.pth", parseTorch},
Michael Yang's avatar
Michael Yang committed
70
71
	}

Michael Yang's avatar
Michael Yang committed
72
73
	for _, pattern := range patterns {
		matches, err := fs.Glob(fsys, pattern.Pattern)
Michael Yang's avatar
Michael Yang committed
74
75
76
77
78
		if err != nil {
			return nil, err
		}

		if len(matches) > 0 {
Michael Yang's avatar
Michael Yang committed
79
			return pattern.Func(fsys, matches...)
Michael Yang's avatar
Michael Yang committed
80
81
82
83
84
		}
	}

	return nil, errors.New("unknown tensor format")
}