Commit b886b7bb authored by Mohammad Shoeybi
Browse files

created megatron package

parent 4947002d
......@@ -19,7 +19,7 @@ import torch.distributed as dist
from torch.nn.modules import Module
from torch.autograd import Variable
-import mpu
+from megatron import mpu
class DistributedDataParallel(Module):
......
......@@ -18,7 +18,7 @@
import torch
import torch.nn.functional as F
-import mpu
+from megatron import mpu
def init_method_normal(std=0.02):
......
......@@ -34,9 +34,9 @@ from torch.nn import CrossEntropyLoss
#from torch.utils.checkpoint import checkpoint
-from data_utils.file_utils import cached_path
+from megatron.data_utils.file_utils import cached_path
-import mpu
+from megatron import mpu
def normal_init_method(mean, std):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment