# tokenizer_GPTJ.py (committed by yangzhong)
from transformers import AutoTokenizer


def get_transformer_autotokenizer(model_name: str):
    """Build a tokenizer for ``model_name`` through ``AutoTokenizer``.

    The tokenizer is always requested with the same fixed settings:
    ``model_max_length=2048``, ``padding_side="left"`` and
    ``use_fast=False``.

    Args:
        model_name: Forwarded unchanged as the first positional argument
            of ``AutoTokenizer.from_pretrained``.

    Returns:
        The object returned by ``AutoTokenizer.from_pretrained``.
    """
    # Fixed loading options, kept together so they are easy to audit.
    tokenizer_options = {
        "model_max_length": 2048,
        "padding_side": "left",
        "use_fast": False,
    }
    return AutoTokenizer.from_pretrained(model_name, **tokenizer_options)