Fix momentum setting in BatchNorm forward pass. (#18764)
authorSpandan Tiwari <sptiwari@microsoft.com>
Mon, 8 Apr 2019 23:21:30 +0000 (16:21 -0700)
committerFacebook Github Bot <facebook-github-bot@users.noreply.github.com>
Mon, 8 Apr 2019 23:30:00 +0000 (16:30 -0700)
Summary:
This is a fix for issue https://github.com/pytorch/pytorch/issues/18525. The issue is not limited to ONNX export; it can manifest in other scenarios as well.
An existing test point in test/onnx/test_operators.py has been updated to cover this scenario as well.
Pull Request resolved: https://github.com/pytorch/pytorch/pull/18764

Reviewed By: zrphercule

Differential Revision: D14735166

Pulled By: houseroad

fbshipit-source-id: 5a737c648f64355929ff31eb12bd4869e744768d

test/onnx/expect/TestOperators.test_batchnorm.expect
test/onnx/expect/TestOperators.test_batchnorm_1d.expect
test/onnx/expect/TestOperators.test_batchnorm_noaffine.expect
test/onnx/test_operators.py
torch/nn/modules/batchnorm.py

index e9edb45..44226c5 100644 (file)
@@ -17,7 +17,7 @@ graph {
     }
     attribute {
       name: "momentum"
-      f: 1
+      f: 0.9
       type: FLOAT
     }
   }
index f3dac32..a8097f1 100644 (file)
@@ -27,7 +27,7 @@ graph {
     }
     attribute {
       name: "momentum"
-      f: 1
+      f: 0.9
       type: FLOAT
     }
   }
index 6e7b9e7..9f7765a 100644 (file)
@@ -43,7 +43,7 @@ graph {
     }
     attribute {
       name: "momentum"
-      f: 1
+      f: 0.7
       type: FLOAT
     }
   }
index 77764f5..0b1fe97 100644 (file)
@@ -480,7 +480,7 @@ class TestOperators(TestCase):
 
     def test_batchnorm_noaffine(self):
         x = torch.randn(128, 128, 1, 1, requires_grad=True)
-        self.assertONNX(nn.BatchNorm2d(128, affine=False), x)
+        self.assertONNX(nn.BatchNorm2d(128, affine=False, momentum=0.3), x)
 
     def test_embedding_bags(self):
         emb_bag = nn.EmbeddingBag(10, 8)
index 2d2034b..cf360bf 100644 (file)
@@ -60,7 +60,13 @@ class _BatchNorm(Module):
     def forward(self, input):
         self._check_input_dim(input)
 
-        exponential_average_factor = 0.0
+        # exponential_average_factor is set to self.momentum
+        # (when it is available) so that it gets updated
+        # in the ONNX graph when this node is exported to ONNX.
+        if self.momentum is None:
+            exponential_average_factor = 0.0
+        else:
+            exponential_average_factor = self.momentum
 
         if self.training and self.track_running_stats:
             # TODO: if statement only here to tell the jit to skip emitting this when it is None