Fix batch norm multiplier init (#12325)

Summary:
Fixes #12259
Pull Request resolved: https://github.com/pytorch/pytorch/pull/12325
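
As a minimal sanity check of the new behavior (a sketch, assuming this patch is applied and torch is importable), a freshly constructed BatchNorm layer now starts out as an identity scale-and-shift: gamma (weight) is all ones and beta (bias) is all zeros instead of gamma being drawn from U(0, 1).

    import torch
    import torch.nn as nn

    # Illustrative check of the default affine initialization after this patch.
    bn = nn.BatchNorm2d(8)
    assert torch.equal(bn.weight.data, torch.ones(8))   # gamma == 1 everywhere
    assert torch.equal(bn.bias.data, torch.zeros(8))    # beta == 0 everywhere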

Differential Revision: D10203439

Pulled By: SsnL

fbshipit-source-id: 999cc134a45e2554313adb7eb93ee98e1f84335f
diff --git a/torch/nn/modules/batchnorm.py b/torch/nn/modules/batchnorm.py
index deb280a..393e44b 100644
--- a/torch/nn/modules/batchnorm.py
+++ b/torch/nn/modules/batchnorm.py
@@ -43,7 +43,7 @@
     def reset_parameters(self):
         self.reset_running_stats()
         if self.affine:
-            init.uniform_(self.weight)
+            init.ones_(self.weight)
             init.zeros_(self.bias)
 
     def _check_input_dim(self, input):
@@ -97,8 +97,8 @@
 
     The mean and standard-deviation are calculated per-dimension over
     the mini-batches and :math:`\gamma` and :math:`\beta` are learnable parameter vectors
-    of size `C` (where `C` is the input size). By default, the elements of :math:`\gamma` are sampled
-    from :math:`\mathcal{U}(0, 1)` and the elements of :math:`\beta` are set to 0.
+    of size `C` (where `C` is the input size). By default, the elements of :math:`\gamma` are set
+    to 1 and the elements of :math:`\beta` are set to 0.
 
     Also by default, during training this layer keeps running estimates of its
     computed mean and variance, which are then used for normalization during
@@ -169,8 +169,8 @@
 
     The mean and standard-deviation are calculated per-dimension over
     the mini-batches and :math:`\gamma` and :math:`\beta` are learnable parameter vectors
-    of size `C` (where `C` is the input size). By default, the elements of :math:`\gamma` are sampled
-    from :math:`\mathcal{U}(0, 1)` and the elements of :math:`\beta` are set to 0.
+    of size `C` (where `C` is the input size). By default, the elements of :math:`\gamma` are set
+    to 1 and the elements of :math:`\beta` are set to 0.
 
     Also by default, during training this layer keeps running estimates of its
     computed mean and variance, which are then used for normalization during
@@ -241,8 +241,8 @@
 
     The mean and standard-deviation are calculated per-dimension over
     the mini-batches and :math:`\gamma` and :math:`\beta` are learnable parameter vectors
-    of size `C` (where `C` is the input size). By default, the elements of :math:`\gamma` are sampled
-    from :math:`\mathcal{U}(0, 1)` and the elements of :math:`\beta` are set to 0.
+    of size `C` (where `C` is the input size). By default, the elements of :math:`\gamma` are set
+    to 1 and the elements of :math:`\beta` are set to 0.
 
     Also by default, during training this layer keeps running estimates of its
     computed mean and variance, which are then used for normalization during