rm BertLayerNorm

Summary: Pull Request resolved: https://github.com/fairinternal/fairseq-py/pull/608

Differential Revision: D15541220

Pulled By: myleott

fbshipit-source-id: 52a8e4da72cc6e3e25cf98c989d34a269d614c9d

rm BertLayerNorm
Summary: Pull Request resolved: https://github.com/fairinternal/fairseq-py/pull/608

Differential Revision: D15541220

Pulled By: myleott

fbshipit-source-id: 52a8e4da72cc6e3e25cf98c989d34a269d614c9d
3e472b22 · Myle Ott · Facebook Github Bot · ed592ab5 · 3e472b22 · ed592ab5
Commit 3e472b22 authored May 29, 2019 by Myle Ott Committed by Facebook Github Bot May 29, 2019
Show whitespace changes
Inline Side-by-side

Showing with 0 additions and 29 deletions

fairseq/modules/__init__.py fairseq/modules/__init__.py +0 -2

fairseq/modules/bert_layer_norm.py fairseq/modules/bert_layer_norm.py +0 -27

No files found.
--- a/fairseq/modules/__init__.py
+++ b/fairseq/modules/__init__.py
@@ -8,7 +8,6 @@
 from .adaptive_input import AdaptiveInput
 from .adaptive_softmax import AdaptiveSoftmax
 from .beamable_mm import BeamableMM
-from .bert_layer_norm import BertLayerNorm
 from .character_token_embedder import CharacterTokenEmbedder
 from .conv_tbc import ConvTBC
 from .downsampled_multihead_attention import DownsampledMultiHeadAttention
@@ -34,7 +33,6 @@ __all__ = [
    'AdaptiveInput',
    'AdaptiveSoftmax',
    'BeamableMM',
-    'BertLayerNorm',
    'CharacterTokenEmbedder',
    'ConvTBC',
    'DownsampledMultiHeadAttention',

--- a/fairseq/modules/bert_layer_norm.py
+++ b/fairseq/modules/bert_layer_norm.py
-# Copyright (c) 2017-present, Facebook, Inc.
-# All rights reserved.
-#
-# This source code is licensed under the license found in the LICENSE file in
-# the root directory of this source tree. An additional grant of patent rights
-# can be found in the PATENTS file in the same directory.
-import torch
-import torch.nn as nn
-class BertLayerNorm(nn.Module):
-    def __init__(self, hidden_size, eps=1e-12):
-        """
-        Construct a layernorm module in the TF style used with BERT
-        (epsilon inside the square root).
-        """
-        super(BertLayerNorm, self).__init__()
-        self.weight = nn.Parameter(torch.ones(hidden_size))
-        self.bias = nn.Parameter(torch.zeros(hidden_size))
-        self.variance_epsilon = eps
-    def forward(self, x):
-        u = x.mean(-1, keepdim=True)
-        s = (x - u).pow(2).mean(-1, keepdim=True)
-        x = (x - u) / torch.sqrt(s + self.variance_epsilon)
-        return self.weight * x + self.bias