Commit 99a5d19

SsnL authored and facebook-github-bot committed
Rename elementwise_mean to mean (pytorch#13419)
Summary: Closes pytorch#12459
Pull Request resolved: pytorch#13419
Differential Revision: D12883299
Pulled By: SsnL
fbshipit-source-id: 8b4512ff73b66fdc674412904dbb3bf497ba70a7
1 parent a5b627a commit 99a5d19

33 files changed: +247 −244 lines
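
For callers the change is a mechanical rename: the C++ enum value Reduction::ElementwiseMean becomes Reduction::Mean, and the corresponding Python-side reduction string 'elementwise_mean' becomes 'mean'. A minimal before/after sketch, assuming the generated at::mse_loss overload that takes the reduction as an int64_t (the same overload exercised in the aten/src/ATen/test/basic.cpp change below):

#include <ATen/ATen.h>
#include <ATen/core/Reduction.h>

void example() {
  at::Tensor input = at::randn({4, 3});
  at::Tensor target = at::randn({4, 3});
  // Before this commit:
  //   auto loss = at::mse_loss(input, target, Reduction::ElementwiseMean);
  // After:
  at::Tensor loss = at::mse_loss(input, target, Reduction::Mean);
  // Reduction::Mean averages the per-element losses into a 0-dim tensor.
}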

aten/src/ATen/core/Reduction.h (+1 −1)

@@ -7,7 +7,7 @@ namespace Reduction {
 // Ideally, this would be a scoped enum, but jit doesn't support that
 enum Reduction {
   None,             // Do not reduce
-  ElementwiseMean,  // Sum losses and take mean over each individually computed loss element
+  Mean,             // (Possibly weighted) mean of losses
   Sum,              // Sum losses
   END
 };

aten/src/ATen/native/Loss.cpp (+3 −3)

@@ -7,7 +7,7 @@

 namespace {
 static inline at::Tensor apply_loss_reduction(const at::Tensor& unreduced, int64_t reduction) {
-  if (reduction == Reduction::ElementwiseMean) {
+  if (reduction == Reduction::Mean) {
     return unreduced.mean();
   } else if (reduction == Reduction::Sum) {
     return unreduced.sum();
@@ -81,7 +81,7 @@ Tensor kl_div_backward_cpu(const Tensor& grad, const Tensor& input, const Tensor
       }
     });
   });
-  if (reduction == Reduction::ElementwiseMean) {
+  if (reduction == Reduction::Mean) {
     return grad_input / input.numel();
   }
   return grad_input;
@@ -119,7 +119,7 @@ Tensor binary_cross_entropy_with_logits_backward(const Tensor& grad, const Tenso
     grad_input.mul_(weight);
   }

-  if (reduction == Reduction::ElementwiseMean) {
+  if (reduction == Reduction::Mean) {
     return grad_input / input.numel();
   }
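
The renamed branch is the shared reduction tail: every loss in this file computes an unreduced per-element tensor and hands it to apply_loss_reduction. A self-contained sketch of a loss built on that pattern (my_l2_loss is a hypothetical example, not a function in this diff):

#include <ATen/ATen.h>
#include <ATen/core/Reduction.h>

// Hypothetical loss following the Loss.cpp pattern: compute per-element
// losses first, then apply the requested reduction once at the end.
at::Tensor my_l2_loss(const at::Tensor& input, const at::Tensor& target,
                      int64_t reduction) {
  at::Tensor unreduced = (input - target).pow(2);
  if (reduction == Reduction::Mean) {
    return unreduced.mean();  // average over all loss elements
  } else if (reduction == Reduction::Sum) {
    return unreduced.sum();   // sum over all loss elements
  }
  return unreduced;           // Reduction::None: keep per-element losses
}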

aten/src/ATen/native/LossCTC.cpp (+1 −1)

@@ -353,7 +353,7 @@ Tensor ctc_loss(const Tensor& log_probs, const Tensor& targets, IntList input_le
   } else {
     res = std::get<0>(at::_ctc_loss(log_probs, targets, input_lengths, target_lengths, BLANK));
   }
-  if (reduction == Reduction::ElementwiseMean) {
+  if (reduction == Reduction::Mean) {
     auto target_lengths_t = at::tensor(target_lengths, res.options().device(at::Device(at::Device::Type::CPU)).dtype(kLong)).toType(res.type());
     return (res / target_lengths_t).mean();
   } else if (reduction == Reduction::Sum) {
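
Note that for CTC the Mean branch is not a plain element mean: each batch entry's loss is first divided by its own target length, and only then are the results averaged. A simplified sketch of that branch (the dtype/device bookkeeping from the hunk above is elided):

#include <ATen/ATen.h>

// Simplified: res holds one CTC loss value per batch element.
at::Tensor ctc_mean(const at::Tensor& res, at::IntList target_lengths) {
  auto lengths_t = at::tensor(target_lengths, res.options());
  return (res / lengths_t).mean();  // normalize by target length, then batch mean
}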

aten/src/ATen/native/cuda/Loss.cu (+1 −1)

@@ -31,7 +31,7 @@ Tensor kl_div_backward_cuda(const Tensor& grad, const Tensor& input, const Tenso
   AT_DISPATCH_FLOATING_TYPES_AND_HALF(input.type(), "kl_div_backward", [&]() {
     kl_div_backward_kernel<scalar_t>(grad_input, target, grad_expand);
   });
-  if (reduction == Reduction::ElementwiseMean) {
+  if (reduction == Reduction::Mean) {
     return grad_input / input.numel();
   }
   return grad_input;

aten/src/ATen/native/native_functions.yaml (+8 −8)

@@ -461,7 +461,7 @@
     CPU: _cosh_out_cpu
     CUDA: _cosh_out_cuda

-- func: cosine_embedding_loss(Tensor input1, Tensor input2, Tensor target, double margin=0.0, int64_t reduction=Reduction::ElementwiseMean) -> Tensor
+- func: cosine_embedding_loss(Tensor input1, Tensor input2, Tensor target, double margin=0.0, int64_t reduction=Reduction::Mean) -> Tensor

 - func: cudnn_affine_grid_generator(Tensor theta, int64_t N, int64_t C, int64_t H, int64_t W) -> Tensor
   return:
@@ -568,10 +568,10 @@

 - func: cumprod_out(Tensor result, Tensor self, int64_t dim) -> Tensor

-- func: ctc_loss(Tensor log_probs, Tensor targets, IntList input_lengths, IntList target_lengths, int64_t blank=0, int64_t reduction=Reduction::ElementwiseMean) -> Tensor
+- func: ctc_loss(Tensor log_probs, Tensor targets, IntList input_lengths, IntList target_lengths, int64_t blank=0, int64_t reduction=Reduction::Mean) -> Tensor

 # convenience function that converts to intlists for you
-- func: ctc_loss(Tensor log_probs, Tensor targets, Tensor input_lengths, Tensor target_lengths, int64_t blank=0, int64_t reduction=Reduction::ElementwiseMean) -> Tensor
+- func: ctc_loss(Tensor log_probs, Tensor targets, Tensor input_lengths, Tensor target_lengths, int64_t blank=0, int64_t reduction=Reduction::Mean) -> Tensor

 - func: _ctc_loss(Tensor log_probs, Tensor targets, IntList input_lengths, IntList target_lengths, int64_t blank=0) -> (Tensor, Tensor)
   dispatch:
@@ -831,7 +831,7 @@

 - func: hamming_window(int64_t window_length, bool periodic, double alpha, double beta, TensorOptions options={}) -> Tensor

-- func: hinge_embedding_loss(Tensor self, Tensor target, double margin=1.0, int64_t reduction=Reduction::ElementwiseMean) -> Tensor
+- func: hinge_embedding_loss(Tensor self, Tensor target, double margin=1.0, int64_t reduction=Reduction::Mean) -> Tensor

 - func: ger(Tensor self, Tensor vec2) -> Tensor
   variants: function, method
@@ -937,9 +937,9 @@
   variants: function, method
   device_guard: false

-- func: kl_div(Tensor self, Tensor target, int64_t reduction=Reduction::ElementwiseMean) -> Tensor
+- func: kl_div(Tensor self, Tensor target, int64_t reduction=Reduction::Mean) -> Tensor

-- func: kl_div_backward(Tensor grad_output, Tensor self, Tensor target, int64_t reduction=Reduction::ElementwiseMean) -> Tensor
+- func: kl_div_backward(Tensor grad_output, Tensor self, Tensor target, int64_t reduction=Reduction::Mean) -> Tensor
   dispatch:
     CPU: kl_div_backward_cpu
     CUDA: kl_div_backward_cuda
@@ -1054,7 +1054,7 @@

 - func: logsumexp_out(Tensor result, Tensor self, int64_t dim, bool keepdim=False) -> Tensor

-- func: margin_ranking_loss(Tensor input1, Tensor input2, Tensor target, double margin=0.0, int64_t reduction=Reduction::ElementwiseMean) -> Tensor
+- func: margin_ranking_loss(Tensor input1, Tensor input2, Tensor target, double margin=0.0, int64_t reduction=Reduction::Mean) -> Tensor

 - func: matmul(Tensor self, Tensor other) -> Tensor
   variants: function, method
@@ -1699,7 +1699,7 @@

 - func: _trilinear(Tensor i1, Tensor i2, Tensor i3, IntList expand1, IntList expand2, IntList expand3, IntList sumdim, int64_t unroll_dim=1) -> Tensor

-- func: triplet_margin_loss(Tensor anchor, Tensor positive, Tensor negative, double margin=1.0, double p=2, double eps=1e-6, bool swap=false, int64_t reduction=Reduction::ElementwiseMean) -> Tensor
+- func: triplet_margin_loss(Tensor anchor, Tensor positive, Tensor negative, double margin=1.0, double p=2, double eps=1e-6, bool swap=false, int64_t reduction=Reduction::Mean) -> Tensor

 - func: trunc(Tensor self) -> Tensor
   variants: function, method
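
Since these schemas supply default arguments, any caller that omits reduction now gets Reduction::Mean; for example, through the generated wrapper (a sketch):

#include <ATen/ATen.h>

void kl_example() {
  at::Tensor log_p = at::log_softmax(at::randn({2, 5}), /*dim=*/1);
  at::Tensor q = at::softmax(at::randn({2, 5}), /*dim=*/1);
  // reduction defaults to Reduction::Mean per the kl_div schema above,
  // so loss is a 0-dim tensor holding the mean of the per-element losses.
  at::Tensor loss = at::kl_div(log_p, q);
}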

aten/src/ATen/nn.yaml (+9 −9)

@@ -1,52 +1,52 @@
 # Loss functions

-- name: binary_cross_entropy(Tensor self, Tensor target, Tensor weight={}, int64_t reduction=Reduction::ElementwiseMean)
+- name: binary_cross_entropy(Tensor self, Tensor target, Tensor weight={}, int64_t reduction=Reduction::Mean)
   cname: BCECriterion
   scalar_check:
     output: reduction != Reduction::None || self_->dim() == 0

-- name: l1_loss(Tensor self, Tensor target, int64_t reduction=Reduction::ElementwiseMean)
+- name: l1_loss(Tensor self, Tensor target, int64_t reduction=Reduction::Mean)
   cname: AbsCriterion
   scalar_check:
     output: reduction != Reduction::None || self_->dim() == 0

-- name: mse_loss(Tensor self, Tensor target, int64_t reduction=Reduction::ElementwiseMean)
+- name: mse_loss(Tensor self, Tensor target, int64_t reduction=Reduction::Mean)
   cname: MSECriterion
   scalar_check:
     output: reduction != Reduction::None || self_->dim() == 0

-- name: multi_margin_loss(Tensor self, LongTensor target, Scalar p=1, Scalar margin=1, Tensor weight={}, int64_t reduction=Reduction::ElementwiseMean)
+- name: multi_margin_loss(Tensor self, LongTensor target, Scalar p=1, Scalar margin=1, Tensor weight={}, int64_t reduction=Reduction::Mean)
   cname: MultiMarginCriterion
   scalar_check:
     output: reduction != Reduction::None || self_->dim() == 0

-- name: multilabel_margin_loss(Tensor self, LongTensor target, int64_t reduction=Reduction::ElementwiseMean)
+- name: multilabel_margin_loss(Tensor self, LongTensor target, int64_t reduction=Reduction::Mean)
   cname: MultiLabelMarginCriterion
   buffers: [is_target]
   scalar_check:
     output: reduction != Reduction::None || self_->dim() == 0
     is_target: target_->dim() == 0

-- name: nll_loss(Tensor self, LongTensor target, Tensor weight={}, int64_t reduction=Reduction::ElementwiseMean, int64_t ignore_index=-100)
+- name: nll_loss(Tensor self, LongTensor target, Tensor weight={}, int64_t reduction=Reduction::Mean, int64_t ignore_index=-100)
   cname: ClassNLLCriterion
   buffers: [total_weight]
   scalar_check:
     output: reduction != Reduction::None || self_->dim() == 0
     total_weight: 'true'

-- name: nll_loss2d(Tensor self, LongTensor target, Tensor weight={}, int64_t reduction=Reduction::ElementwiseMean, int64_t ignore_index=-100)
+- name: nll_loss2d(Tensor self, LongTensor target, Tensor weight={}, int64_t reduction=Reduction::Mean, int64_t ignore_index=-100)
   cname: SpatialClassNLLCriterion
   buffers: [total_weight]
   scalar_check:
     output: reduction != Reduction::None || self_->dim() == 0
     total_weight: 'true'

-- name: smooth_l1_loss(Tensor self, Tensor target, int64_t reduction=Reduction::ElementwiseMean)
+- name: smooth_l1_loss(Tensor self, Tensor target, int64_t reduction=Reduction::Mean)
   cname: SmoothL1Criterion
   scalar_check:
     output: reduction != Reduction::None || self_->dim() == 0

-- name: soft_margin_loss(Tensor self, Tensor target, int64_t reduction=Reduction::ElementwiseMean)
+- name: soft_margin_loss(Tensor self, Tensor target, int64_t reduction=Reduction::Mean)
   cname: SoftMarginCriterion
   scalar_check:
     output: reduction != Reduction::None || self_->dim() == 0
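
The unchanged scalar_check lines spell out the shape contract these bindings enforce: any reduced loss comes back as a 0-dim tensor, while Reduction::None preserves per-element losses. A quick sketch, assuming the generated at:: wrappers (ArrayRef::equals is used for the shape comparison):

#include <ATen/ATen.h>
#include <ATen/core/Reduction.h>

void shapes() {
  at::Tensor x = at::randn({4, 3});
  at::Tensor t = at::randn({4, 3});
  // Reduced: 0-dim tensor (scalar_check: reduction != Reduction::None).
  AT_ASSERT(at::mse_loss(x, t, Reduction::Mean).dim() == 0);
  // Unreduced: same shape as the input.
  AT_ASSERT(at::mse_loss(x, t, Reduction::None).sizes().equals(x.sizes()));
}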

aten/src/ATen/test/basic.cpp (+1 −1)

@@ -271,7 +271,7 @@ static void test(Type& type) {
   CATCH_SECTION("dispatch") {
     Tensor tensor = randn({20, 20});
     Tensor other = randn({20, 20});
-    auto result = tensor.m(relu).m(mse_loss, other, Reduction::ElementwiseMean);
+    auto result = tensor.m(relu).m(mse_loss, other, Reduction::Mean);
     CATCH_REQUIRE(result.allclose(mse_loss(relu(tensor), other)));
   }
   CATCH_SECTION("core") {

aten/src/THCUNN/generic/AbsCriterion.cu (+2 −2)

@@ -30,7 +30,7 @@ void THNN_(AbsCriterion_updateOutput)(
   thrust::device_ptr<scalar_t> target_data(THCTensor_(data)(state, target));
   accreal sum = thrust::inner_product(input_data, input_data+size, target_data, (accreal)0, thrust::plus<accreal>(), abs_functor<scalar_t, accreal>());

-  if (reduction == Reduction::ElementwiseMean)
+  if (reduction == Reduction::Mean)
     sum /= size;

   THCTensor_(free)(state, input);
@@ -63,7 +63,7 @@ void THNN_(AbsCriterion_updateGradInput)(
   THCUNN_check_dim_size(state, gradOutput, 1, 0, 1);

   ptrdiff_t size = THCTensor_(nElement)(state, input);
-  scalar_t norm = ScalarConvert<double, scalar_t>::to(reduction == Reduction::ElementwiseMean ? 1./size : 1.);
+  scalar_t norm = ScalarConvert<double, scalar_t>::to(reduction == Reduction::Mean ? 1./size : 1.);

   input = THCTensor_(newContiguous)(state, input);
   target = THCTensor_(newContiguous)(state, target);

aten/src/THCUNN/generic/BCECriterion.cu (+2 −2)

@@ -57,7 +57,7 @@ void THNN_(BCECriterion_updateOutput)(
     );
   }

-  if (reduction == Reduction::ElementwiseMean)
+  if (reduction == Reduction::Mean)
     sum /= size;

   THCTensor_(free)(state, input);
@@ -95,7 +95,7 @@ void THNN_(BCECriterion_updateGradInput)(
   THCUNN_check_dim_size(state, gradOutput, 1, 0, 1);

   ptrdiff_t size = THCTensor_(nElement)(state, input);
-  scalar_t norm = ScalarConvert<accreal, scalar_t>::to((reduction == Reduction::ElementwiseMean ? accreal(1)/size : accreal(1)) * THCTensor_(get1d)(state, gradOutput, 0));
+  scalar_t norm = ScalarConvert<accreal, scalar_t>::to((reduction == Reduction::Mean ? accreal(1)/size : accreal(1)) * THCTensor_(get1d)(state, gradOutput, 0));

   input = THCTensor_(newContiguous)(state, input);
   target = THCTensor_(newContiguous)(state, target);

aten/src/THCUNN/generic/ClassNLLCriterion.cu (+4 −4)

@@ -88,7 +88,7 @@ void THNN_(ClassNLLCriterion_updateOutput)(
       input_data,
       target_data,
       weights_data,
-      reduction == Reduction::ElementwiseMean,
+      reduction == Reduction::Mean,
       n_classes,
       ignore_index
   );
@@ -101,7 +101,7 @@ void THNN_(ClassNLLCriterion_updateOutput)(
       input_data,
       target_data,
       weights_data,
-      reduction == Reduction::ElementwiseMean,
+      reduction == Reduction::Mean,
       THCTensor_(size)(state, input, 0),
       THCTensor_(size)(state, input, 1),
       n_classes,
@@ -205,7 +205,7 @@ void THNN_(ClassNLLCriterion_updateGradInput)(
       weights_data,
       target_data,
       total_weight_data,
-      reduction == Reduction::ElementwiseMean,
+      reduction == Reduction::Mean,
       n_classes,
       ignore_index
   );
@@ -217,7 +217,7 @@ void THNN_(ClassNLLCriterion_updateGradInput)(
       target_data,
       weights_data,
       total_weight_data,
-      reduction == Reduction::ElementwiseMean,
+      reduction == Reduction::Mean,
       THCTensor_(size)(state, input, 0),
       THCTensor_(size)(state, input, 1),
       n_classes,

aten/src/THCUNN/generic/DistKLDivCriterion.cu (+2 −2)

@@ -35,7 +35,7 @@ void THNN_(DistKLDivCriterion_updateOutput)(
   thrust::device_ptr<scalar_t> target_data(THCTensor_(data)(state, target));
   sum = thrust::inner_product(input_data, input_data+size, target_data, (accreal) 0, thrust::plus<accreal>(), kl_functor<scalar_t, accreal>());

-  if (reduction == Reduction::ElementwiseMean)
+  if (reduction == Reduction::Mean)
     sum /= size;

   THCTensor_(free)(state, input);
@@ -70,7 +70,7 @@ void THNN_(DistKLDivCriterion_updateGradInput)(
   THCUNN_check_dim_size(state, gradOutput, 1, 0, 1);

   ptrdiff_t size = THCTensor_(nElement)(state, input);
-  scalar_t norm = (reduction == Reduction::ElementwiseMean ? ScalarConvert<accreal, scalar_t>::to(accreal(1)/size) : ScalarConvert<int, scalar_t>::to(1));
+  scalar_t norm = (reduction == Reduction::Mean ? ScalarConvert<accreal, scalar_t>::to(accreal(1)/size) : ScalarConvert<int, scalar_t>::to(1));

   input = THCTensor_(newContiguous)(state, input);
   target = THCTensor_(newContiguous)(state, target);

aten/src/THCUNN/generic/MSECriterion.cu (+2 −2)

@@ -30,7 +30,7 @@ void THNN_(MSECriterion_updateOutput)(
     input_data, input_data+size, target_data, (accreal) 0,
     thrust::plus<accreal>(), mse_functor<scalar_t, accreal>());

-  if (reduction == Reduction::ElementwiseMean)
+  if (reduction == Reduction::Mean)
     sum /= size;

   THCTensor_(free)(state, input);
@@ -64,7 +64,7 @@ void THNN_(MSECriterion_updateGradInput)(
   ptrdiff_t size = THCTensor_(nElement)(state, input);

   THCUNN_check_dim_size(state, gradOutput, 1, 0, 1);
-  accreal norm = reduction == Reduction::ElementwiseMean ? (accreal)(2)/size : (accreal)(2);
+  accreal norm = reduction == Reduction::Mean ? (accreal)(2)/size : (accreal)(2);
   norm *= ScalarConvert<scalar_t, accreal>::to(THCTensor_(get1d)(state, gradOutput, 0));

   input = THCTensor_(newContiguous)(state, input);
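
The 2/size factor in the backward hunk is just the derivative of the mean-reduced squared error: for L = (1/N) * sum_i (x_i - t_i)^2, dL/dx_i = (2/N) * (x_i - t_i), so norm is 2/N under Reduction::Mean and 2 otherwise, before scaling by the incoming gradOutput. The 1/size versus 1 factors in the AbsCriterion and DistKLDivCriterion backward hunks above follow the same pattern, minus the exponent's factor of 2.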

aten/src/THCUNN/generic/MultiLabelMarginCriterion.cu (+4 −4)

@@ -33,7 +33,7 @@ void THNN_(MultiLabelMarginCriterion_updateOutput)(
       THCIndexTensor_(data)(state, target),
       THCTensor_(data)(state, istarget),
       1, dim,
-      reduction == Reduction::ElementwiseMean
+      reduction == Reduction::Mean
   );
   THCudaCheck(cudaGetLastError());
 }
@@ -59,7 +59,7 @@ void THNN_(MultiLabelMarginCriterion_updateOutput)(
       THCIndexTensor_(data)(state, target),
       THCTensor_(data)(state, istarget),
       nframe, dim,
-      reduction == Reduction::ElementwiseMean
+      reduction == Reduction::Mean
   );
   THCudaCheck(cudaGetLastError());
   THCTensor_(set1d)(state, output, 0, ScalarConvert<accreal, scalar_t>::to(THCTensor_(sumall)(state, output_tmp)));
@@ -122,7 +122,7 @@ void THNN_(MultiLabelMarginCriterion_updateGradInput)(
      THCIndexTensor_(data)(state, target),
      THCTensor_(data)(state, istarget),
      1, gradInput->size(0),
-     reduction == Reduction::ElementwiseMean,
+     reduction == Reduction::Mean,
      reduction != Reduction::None);

 }
@@ -145,7 +145,7 @@ void THNN_(MultiLabelMarginCriterion_updateGradInput)(
      THCIndexTensor_(data)(state, target),
      THCTensor_(data)(state, istarget),
      gradInput->size(0), gradInput->size(1),
-     reduction == Reduction::ElementwiseMean,
+     reduction == Reduction::Mean,
      reduction != Reduction::None);
 }
 else
