r"""
Utilities for using FastMoE in Megatron.
"""

import argparse

def add_fmoe_args(parser):
    r"""
    Register the FastMoE command-line options on `parser`.

    All options are placed in an argument group titled "fastmoe". If the
    option string `--num-experts` is already registered on the parser, the
    option is added under the name `--fmoe-num-experts` instead.

    Args:
        parser: the `argparse.ArgumentParser` to extend in place.

    Returns:
        The same `parser` object that was passed in.
    """
    group = parser.add_argument_group(title="fastmoe")

    group.add_argument("--fmoefy", action="store_true")
    try:
        group.add_argument("--num-experts", type=int, default=None)
    except argparse.ArgumentError:
        # argparse rejects a duplicate option string with ArgumentError;
        # fall back to a prefixed name so both options can coexist.
        group.add_argument("--fmoe-num-experts", type=int, default=None)
    group.add_argument("--top-k", type=int, default=2)
    # Float literal so the default has the same type as a parsed value
    # (argparse does not run `type` on non-string defaults).
    group.add_argument("--balance-loss-weight", type=float, default=1.0)
    group.add_argument("--balance-strategy", type=str, default=None)
    group.add_argument("--hidden-hidden-size", type=int, default=None)

    return parser