package convert

import (
	"errors"
	"io"
	"io/fs"
	"strings"
)

type Tensor interface {
	Name() string
	Shape() []uint64
	Kind() uint32
Michael Yang's avatar
llama4  
Michael Yang committed
14
	SetRepacker(Repacker)
Michael Yang's avatar
Michael Yang committed
15
	WriteTo(io.Writer) (int64, error)
Michael Yang's avatar
llama4  
Michael Yang committed
16
	Clone() Tensor
Michael Yang's avatar
Michael Yang committed
17
18
19
}

type tensorBase struct {
Michael Yang's avatar
llama4  
Michael Yang committed
20
21
22
	name     string
	shape    []uint64
	repacker Repacker
Michael Yang's avatar
Michael Yang committed
23
24
25
26
27
28
29
30
31
32
}

// Name returns the tensor's name exactly as stored in tensorBase.
func (t tensorBase) Name() string {
	return t.name
}

// Shape returns the tensor's dimensions. The stored slice is returned as-is
// (no copy is made), so callers share its backing array with the tensor.
func (t tensorBase) Shape() []uint64 {
	return t.shape
}

// Tensor kind codes returned by Kind.
//
// tensorKindFP32 and tensorKindFP16 are typed uint32 constants with the
// values 0 and 1 (FP16 implicitly repeats "uint32 = iota"). tensorKindMXFP4
// and tensorKindBF16 are given explicit values and are therefore untyped
// constants; they convert implicitly wherever a uint32 is expected.
//
// NOTE(review): the numeric values presumably have to match the type ids of
// the output file format - confirm before changing any of them.
const (
	tensorKindFP32 uint32 = iota
	tensorKindFP16
	tensorKindMXFP4 = 4
	tensorKindBF16  = 30
)

Michael Yang's avatar
Michael Yang committed
40
func (t tensorBase) Kind() uint32 {
Michael Yang's avatar
Michael Yang committed
41
	if strings.HasSuffix(t.name, ".ffn_gate_inp.weight") ||
Michael Yang's avatar
llama4  
Michael Yang committed
42
		t.name == "token_types.weight" ||
43
44
45
46
		t.name == "v.positional_embedding_vlm" ||
		t.name == "v.tile_position_embd.weight" ||
		t.name == "v.pre_tile_position_embd.weight" ||
		t.name == "v.post_tile_position_embd.weight" {
Michael Yang's avatar
Michael Yang committed
47
		// these tensors are always F32
Michael Yang's avatar
Michael Yang committed
48
		return tensorKindFP32
Michael Yang's avatar
Michael Yang committed
49
50
51
52
53
54
	}

	switch len(t.shape) {
	case 0:
		panic("invalid tensor shape")
	case 1:
Michael Yang's avatar
Michael Yang committed
55
		return tensorKindFP32
Michael Yang's avatar
Michael Yang committed
56
	default:
Michael Yang's avatar
Michael Yang committed
57
		return tensorKindFP16
Michael Yang's avatar
Michael Yang committed
58
59
60
	}
}

Michael Yang's avatar
llama4  
Michael Yang committed
61
func (t *tensorBase) SetRepacker(fn Repacker) {
Michael Yang's avatar
Michael Yang committed
62
63
64
	t.repacker = fn
}

// Repacker is a function that takes a string, a []float32 and a []uint64 and
// returns a []float32 or an error.
//
// NOTE(review): the arguments are presumably the tensor name, its decoded
// values and its shape, with the result being the rearranged values -
// confirm against the call sites, which are not in this file.
type Repacker func(string, []float32, []uint64) ([]float32, error)

Michael Yang's avatar
Michael Yang committed
67
func parseTensors(fsys fs.FS, replacer *strings.Replacer) ([]Tensor, error) {
Michael Yang's avatar
Michael Yang committed
68
69
	patterns := []struct {
		Pattern string
Michael Yang's avatar
Michael Yang committed
70
		Func    func(fs.FS, *strings.Replacer, ...string) ([]Tensor, error)
Michael Yang's avatar
Michael Yang committed
71
	}{
72
		{"*.safetensors", parseSafetensors},
Michael Yang's avatar
Michael Yang committed
73
74
75
		{"pytorch_model-*-of-*.bin", parseTorch},
		{"pytorch_model.bin", parseTorch},
		{"consolidated.*.pth", parseTorch},
Michael Yang's avatar
Michael Yang committed
76
77
	}

Michael Yang's avatar
Michael Yang committed
78
79
	for _, pattern := range patterns {
		matches, err := fs.Glob(fsys, pattern.Pattern)
Michael Yang's avatar
Michael Yang committed
80
81
82
83
84
		if err != nil {
			return nil, err
		}

		if len(matches) > 0 {
Michael Yang's avatar
Michael Yang committed
85
			return pattern.Func(fsys, replacer, matches...)
Michael Yang's avatar
Michael Yang committed
86
87
88
89
90
		}
	}

	return nil, errors.New("unknown tensor format")
}