Commit b886b7bb authored by Mohammad Shoeybi
Browse files

created megatron package

parent 4947002d
...@@ -19,7 +19,7 @@ import torch.distributed as dist ...@@ -19,7 +19,7 @@ import torch.distributed as dist
from torch.nn.modules import Module from torch.nn.modules import Module
from torch.autograd import Variable from torch.autograd import Variable
import mpu → from megatron import mpu
class DistributedDataParallel(Module): class DistributedDataParallel(Module):
......
...@@ -18,7 +18,7 @@ ...@@ -18,7 +18,7 @@
import torch import torch
import torch.nn.functional as F import torch.nn.functional as F
import mpu → from megatron import mpu
def init_method_normal(std=0.02): def init_method_normal(std=0.02):
......
...@@ -34,9 +34,9 @@ from torch.nn import CrossEntropyLoss ...@@ -34,9 +34,9 @@ from torch.nn import CrossEntropyLoss
#from torch.utils.checkpoint import checkpoint #from torch.utils.checkpoint import checkpoint
from data_utils.file_utils import cached_path → from megatron.data_utils.file_utils import cached_path
import mpu → from megatron import mpu
def normal_init_method(mean, std): def normal_init_method(mean, std):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment