sft_trainer.py 1.24 KB
Newer Older
shihm's avatar
uodata  
shihm committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
# Copyright 2025 the LlamaFactory team.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.


from ..accelerator.interface import DistributedInterface
from ..config.arg_parser import get_args
from ..core.base_trainer import BaseTrainer
from ..core.data_engine import DataEngine
from ..core.model_loader import ModelLoader


class SFTTrainer(BaseTrainer):
    pass


def run_sft(user_args):
    model_args, data_args, training_args, _ = get_args(user_args)
    DistributedInterface(training_args.dist_config)
    data_engine = DataEngine(data_args)
    model_loader = ModelLoader(model_args)
    trainer = SFTTrainer(
        args=training_args,
        model=model_loader.model,
        processor=model_loader.processor,
        dataset=data_engine,
    )
    trainer.fit()