phi.py 469 Bytes
Newer Older
yangql's avatar
yangql committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
from ._base import BaseGPTQForCausalLM


class PhiGPTQForCausalLM(BaseGPTQForCausalLM):
    """Module-layout declaration for Phi models on top of ``BaseGPTQForCausalLM``.

    The class adds no methods; it only sets class-level attributes naming
    modules of the Phi architecture by their dotted paths.

    NOTE(review): how each attribute is consumed is defined in ``._base``,
    which is not visible from this file — confirm semantics there.
    """

    # Presumably the class name of a single decoder layer — TODO confirm.
    layer_type = "PhiDecoderLayer"

    # Presumably the dotted path to the container of decoder layers — TODO confirm.
    layers_block_name = "model.layers"

    # Module paths rooted at the model rather than at an individual layer.
    outside_layer_modules = [
        "model.embed_tokens",
        "model.final_layernorm",
    ]

    # Every per-layer module is placed in its own single-element group, in
    # the order listed below.
    # NOTE(review): grouping/order likely matters to the base class — confirm
    # before merging or reordering groups.
    inside_layer_modules = [
        [module_name]
        for module_name in (
            "self_attn.q_proj",
            "self_attn.k_proj",
            "self_attn.v_proj",
            "self_attn.dense",
            "mlp.fc1",
            "mlp.fc2",
        )
    ]


# Public names of this module: only the Phi model class is exported by
# ``from <module> import *``.
__all__ = ["PhiGPTQForCausalLM"]