// reader.go

package convert

import (
	"errors"
	"io"
	"io/fs"
	"strings"
)

type Tensor interface {
	Name() string
	Shape() []uint64
	Kind() uint32
Michael Yang's avatar
llama4  
Michael Yang committed
14
	SetRepacker(Repacker)
Michael Yang's avatar
Michael Yang committed
15
	WriteTo(io.Writer) (int64, error)
Michael Yang's avatar
llama4  
Michael Yang committed
16
	Clone() Tensor
Michael Yang's avatar
Michael Yang committed
17
18
19
}

// tensorBase carries a tensor's name, shape and optional repacker. It
// provides the Name, Shape, Kind and SetRepacker methods; WriteTo and Clone
// are not defined on it.
type tensorBase struct {
	name     string
	shape    []uint64
	repacker Repacker
}

// Name returns the tensor's name.
func (t tensorBase) Name() string {
	return t.name
}

// Shape returns the tensor's shape. The stored slice is returned directly,
// not copied.
func (t tensorBase) Shape() []uint64 {
	return t.shape
}

// Tensor kind codes returned by Kind.
const (
	tensorKindF32 uint32 = iota
	tensorKindF16
)

// Kind reports the kind code for the tensor.
//
// A fixed set of tensor names always yields tensorKindF32 regardless of
// shape. Otherwise one-dimensional tensors are tensorKindF32 and tensors with
// two or more dimensions are tensorKindF16. Kind panics when the shape is
// empty and the name is not in the always-F32 set.
func (t tensorBase) Kind() uint32 {
	if strings.HasSuffix(t.name, ".ffn_gate_inp.weight") ||
		t.name == "token_types.weight" ||
		t.name == "v.positional_embedding_vlm" ||
		t.name == "v.tile_position_embd.weight" ||
		t.name == "v.pre_tile_position_embd.weight" ||
		t.name == "v.post_tile_position_embd.weight" {
		// these tensors are always F32
		return tensorKindF32
	}

	switch len(t.shape) {
	case 0:
		// Kind has no error return, so an empty shape is reported by panicking.
		panic("invalid tensor shape")
	case 1:
		return tensorKindF32
	default:
		return tensorKindF16
	}
}

// SetRepacker stores fn as the tensor's repacker. It uses a pointer receiver
// because it mutates the receiver.
func (t *tensorBase) SetRepacker(fn Repacker) {
	t.repacker = fn
}

// Repacker is a function that takes a string, a []float32 and a []uint64 and
// returns a []float32 or an error.
// NOTE(review): presumably (tensor name, data, shape) -> repacked data —
// confirm against the callers.
type Repacker func(string, []float32, []uint64) ([]float32, error)
func parseTensors(fsys fs.FS, replacer *strings.Replacer) ([]Tensor, error) {
Michael Yang's avatar
Michael Yang committed
66
67
	patterns := []struct {
		Pattern string
Michael Yang's avatar
Michael Yang committed
68
		Func    func(fs.FS, *strings.Replacer, ...string) ([]Tensor, error)
Michael Yang's avatar
Michael Yang committed
69
	}{
70
		{"*.safetensors", parseSafetensors},
Michael Yang's avatar
Michael Yang committed
71
72
73
		{"pytorch_model-*-of-*.bin", parseTorch},
		{"pytorch_model.bin", parseTorch},
		{"consolidated.*.pth", parseTorch},
Michael Yang's avatar
Michael Yang committed
74
75
	}

Michael Yang's avatar
Michael Yang committed
76
77
	for _, pattern := range patterns {
		matches, err := fs.Glob(fsys, pattern.Pattern)
Michael Yang's avatar
Michael Yang committed
78
79
80
81
82
		if err != nil {
			return nil, err
		}

		if len(matches) > 0 {
Michael Yang's avatar
Michael Yang committed
83
			return pattern.Func(fsys, replacer, matches...)
Michael Yang's avatar
Michael Yang committed
84
85
86
87
88
		}
	}

	return nil, errors.New("unknown tensor format")
}