Skip to content

Commit 288c97d

Browse files
author
Mikhail Zolotukhin
committed
Update on "[TensorExpr] Benchmarks: set up profiling executor and fuser according to the given arguments."
Differential Revision: [D21525741](https://our.internmc.facebook.com/intern/diff/D21525741) [ghstack-poisoned]
2 parents d8b3b2c + cfe3c79 commit 288c97d

83 files changed

Lines changed: 814 additions & 1008 deletions

File tree

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

.circleci/config.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -509,7 +509,7 @@ jobs:
509509
if [ "${BUILD_ENVIRONMENT}" == "pytorch-linux-bionic-py3.6-clang9-test" ]; then
510510
return 0
511511
fi
512-
if [ "${BUILD_ENVIRONMENT}" == "pytorch-linux-xenial-py3.6-gcc-5.4-test" ]; then
512+
if [ "${BUILD_ENVIRONMENT}" == "pytorch-linux-xenial-py3.6-gcc5.4-test" ]; then
513513
return 0
514514
fi
515515
return 1

.circleci/verbatim-sources/pytorch-job-specs.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -114,7 +114,7 @@ jobs:
114114
if [ "${BUILD_ENVIRONMENT}" == "pytorch-linux-bionic-py3.6-clang9-test" ]; then
115115
return 0
116116
fi
117-
if [ "${BUILD_ENVIRONMENT}" == "pytorch-linux-xenial-py3.6-gcc-5.4-test" ]; then
117+
if [ "${BUILD_ENVIRONMENT}" == "pytorch-linux-xenial-py3.6-gcc5.4-test" ]; then
118118
return 0
119119
fi
120120
return 1

aten/src/ATen/AccumulateType.h

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -37,6 +37,8 @@ template <> struct AccumulateType<bool, true> {using type = bool; };
3737
template <> struct AccumulateType<BFloat16, false> { using type = float; };
3838
template <> struct AccumulateType<std::complex<float>, false> { using type = std::complex<double>; };
3939
template <> struct AccumulateType<std::complex<double>, false> { using type = std::complex<double>; };
40+
template <> struct AccumulateType<c10::complex<float>, false> { using type = c10::complex<double>; };
41+
template <> struct AccumulateType<c10::complex<double>, false> { using type = c10::complex<double>; };
4042
template <> struct AccumulateType<float, false> { using type = double; };
4143
template <> struct AccumulateType<double, false> { using type = double; };
4244
template <> struct AccumulateType<int8_t, false> { using type = int64_t; };

aten/src/ATen/Declarations.cwrap

Lines changed: 0 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -348,20 +348,6 @@
348348
output: True
349349
- THTensor* self
350350
]]
351-
[[
352-
name: _th_atan
353-
cname: atan
354-
types:
355-
- floating_point
356-
backends:
357-
- CUDA
358-
variants: function
359-
return: argument 0
360-
arguments:
361-
- arg: THTensor* result
362-
output: True
363-
- THTensor* self
364-
]]
365351
[[
366352
name: _th_erfc
367353
cname: erfc

aten/src/ATen/core/DistributionsHelper.h

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -57,9 +57,9 @@ struct uniform_int_from_to_distribution {
5757
std::is_same<T, float>::value ||
5858
std::is_same<T, at::BFloat16>::value) && range_ >= 1ULL << 32)
5959
{
60-
return uniform_int_from_to_transformation<T>(generator->random64(), range_, base_);
60+
return transformation::uniform_int_from_to<T>(generator->random64(), range_, base_);
6161
} else {
62-
return uniform_int_from_to_transformation<T>(generator->random(), range_, base_);
62+
return transformation::uniform_int_from_to<T>(generator->random(), range_, base_);
6363
}
6464
}
6565

@@ -76,7 +76,7 @@ struct uniform_int_full_range_distribution {
7676

7777
template <typename RNG>
7878
C10_HOST_DEVICE inline T operator()(RNG generator) {
79-
return uniform_int_full_range_transformation<T>(generator->random64());
79+
return transformation::uniform_int_full_range<T>(generator->random64());
8080
}
8181

8282
};
@@ -91,9 +91,9 @@ struct uniform_int_distribution {
9191
template <typename RNG>
9292
C10_HOST_DEVICE inline T operator()(RNG generator) {
9393
if (std::is_same<T, double>::value || std::is_same<T, int64_t>::value) {
94-
return uniform_int_transformation<T>(generator->random64());
94+
return transformation::uniform_int<T>(generator->random64());
9595
} else {
96-
return uniform_int_transformation<T>(generator->random());
96+
return transformation::uniform_int<T>(generator->random());
9797
}
9898
}
9999

@@ -115,9 +115,9 @@ struct uniform_real_distribution {
115115
template <typename RNG>
116116
C10_HOST_DEVICE inline dist_acctype<T> operator()(RNG generator){
117117
if(std::is_same<T, double>::value) {
118-
return uniform_real_transformation<T>(generator->random64(), from_, to_);
118+
return transformation::uniform_real<T>(generator->random64(), from_, to_);
119119
} else {
120-
return uniform_real_transformation<T>(generator->random(), from_, to_);
120+
return transformation::uniform_real<T>(generator->random(), from_, to_);
121121
}
122122
}
123123

aten/src/ATen/core/TransformationHelper.h

Lines changed: 7 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -25,29 +25,31 @@ template <> struct DistAccumType<double> { using type = double; };
2525
template <typename T>
2626
using dist_acctype = typename DistAccumType<T>::type;
2727

28+
namespace transformation {
29+
2830
/**
2931
* A transformation function for `torch.Tensor.random_()`, when both `from` and `to` are specified.
3032
* `range` is `to - from`
3133
* `base` is `from`
3234
*/
3335
template <typename T, typename V>
34-
C10_HOST_DEVICE inline T uniform_int_from_to_transformation(V val, uint64_t range, int64_t base) {
36+
C10_HOST_DEVICE inline T uniform_int_from_to(V val, uint64_t range, int64_t base) {
3537
return static_cast<T>(static_cast<int64_t>((val % range) + base));
3638
}
3739

3840
/**
3941
* A transformation function for `torch.Tensor.random_()`, when `from=min_value(int64_t)` and to=None
4042
*/
4143
template <typename T, typename V>
42-
C10_HOST_DEVICE inline T uniform_int_full_range_transformation(V val) {
44+
C10_HOST_DEVICE inline T uniform_int_full_range(V val) {
4345
return static_cast<T>(static_cast<int64_t>(val));
4446
}
4547

4648
/**
4749
* A transformation function for `torch.Tensor.random_()`, when used without specifying `from` and `to`.
4850
*/
4951
template <typename T, typename V>
50-
C10_HOST_DEVICE inline T uniform_int_transformation(V val) {
52+
C10_HOST_DEVICE inline T uniform_int(V val) {
5153
if (std::is_same<T, bool>::value) {
5254
return static_cast<bool>(val & 1);
5355
} else if (std::is_same<T, double>::value) {
@@ -65,11 +67,11 @@ C10_HOST_DEVICE inline T uniform_int_transformation(V val) {
6567
}
6668

6769
template <typename T, typename V>
68-
C10_HOST_DEVICE inline dist_acctype<T> uniform_real_transformation(V val, T from, T to) {
70+
C10_HOST_DEVICE inline dist_acctype<T> uniform_real(V val, T from, T to) {
6971
constexpr auto MASK = static_cast<V>((static_cast<uint64_t>(1) << std::numeric_limits<T>::digits) - 1);
7072
constexpr auto DIVISOR = static_cast<dist_acctype<T>>(1) / (static_cast<uint64_t>(1) << std::numeric_limits<T>::digits);
7173
dist_acctype<T> x = (val & MASK) * DIVISOR;
7274
return (x * (to - from) + from);
7375
}
7476

75-
} // namespace at
77+
}} // namespace at::transformation

aten/src/ATen/cpu/vec256/vec256_base.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -157,7 +157,7 @@ struct Vec256 {
157157
static Vec256<T> arange(T base = static_cast<T>(0), step_t step = static_cast<step_t>(1)) {
158158
Vec256 vec;
159159
for (int64_t i = 0; i < size(); i++) {
160-
vec.values[i] = base + i * step;
160+
vec.values[i] = base + static_cast<step_t>(i) * step;
161161
}
162162
return vec;
163163
}

aten/src/ATen/function_wrapper.py

Lines changed: 20 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -44,6 +44,7 @@ def TypedDict(name, attrs, total=True): # type: ignore
4444
default:
4545
AT_ERROR("${api_name} not supported on ${Type} for ", dispatch_scalar_type);
4646
}
47+
${switch_epilogue}
4748
""")
4849

4950
LEGACY_TH_DEFINITION_CASE = CodeTemplate("""\
@@ -1414,19 +1415,7 @@ def emit_body(env, option, scalar_type_cases):
14141415

14151416
if ret['kind'] == 'arguments':
14161417
case_body.extend([call + ';' for call in calls])
1417-
arguments_indices = ret['arguments']
1418-
arguments = [option['arguments'][argi]
1419-
for argi in arguments_indices]
1420-
if len(arguments_indices) == 1:
1421-
arg = arguments[0]
1422-
case_body.append("return {};".format(arg['name']))
1423-
else:
1424-
types = [to_return_type(arg, option)['type']
1425-
for arg in arguments]
1426-
# TODO: check for move semantics...
1427-
names = [arg['name'] for arg in arguments]
1428-
case_body.append(CodeTemplate("return std::tuple<${types}>(${names});").substitute(
1429-
types=types, names=names))
1418+
# return handled later
14301419
elif ret['kind'] == 'type':
14311420
assert len(calls) == 1
14321421
call = calls[0]
@@ -1444,7 +1433,24 @@ def emit_body(env, option, scalar_type_cases):
14441433
raise Exception("NYI - return handling")
14451434

14461435
cases.append(LEGACY_TH_DEFINITION_CASE.substitute(case_env, case_body=case_body))
1447-
body.append(LEGACY_TH_DEFINITION_SWITCH_STATEMENT.substitute(env, cases=cases, switch_prologue=switch_prologue))
1436+
switch_epilogue = ''
1437+
if ret['kind'] == 'arguments':
1438+
arguments_indices = ret['arguments']
1439+
arguments = [option['arguments'][argi]
1440+
for argi in arguments_indices]
1441+
if len(arguments_indices) == 1:
1442+
arg = arguments[0]
1443+
switch_epilogue = "return {};".format(arg['name'])
1444+
else:
1445+
types = [to_return_type(arg, option)['type']
1446+
for arg in arguments]
1447+
# TODO: check for move semantics...
1448+
names = [arg['name'] for arg in arguments]
1449+
switch_epilogue = CodeTemplate("return std::tuple<${types}>(${names});").substitute(
1450+
types=types, names=names)
1451+
body.append(LEGACY_TH_DEFINITION_SWITCH_STATEMENT.substitute(env, cases=cases,
1452+
switch_prologue=switch_prologue,
1453+
switch_epilogue=switch_epilogue))
14481454
return body
14491455

14501456
def process_legacy_th_option(option):

aten/src/ATen/native/DistributionTemplates.h

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -124,7 +124,8 @@ at::Tensor& random_from_to_impl(at::Tensor& self, int64_t from, c10::optional<in
124124
int64_t to_inc = 0;
125125
if (isFloatingType(iter.dtype())) {
126126
AT_DISPATCH_FLOATING_TYPES_AND2(at::ScalarType::Half, at::ScalarType::BFloat16, self.scalar_type(), "random_from_to_range_calc", [&] {
127-
to_inc = std::numeric_limits<scalar_t>::max() > std::numeric_limits<int64_t>::max() ? std::numeric_limits<int64_t>::max() : static_cast<int64_t>(std::numeric_limits<scalar_t>::max());
127+
constexpr int64_t scalar_t_max = static_cast<int64_t>(1) << std::numeric_limits<scalar_t>::digits;
128+
to_inc = scalar_t_max > std::numeric_limits<int64_t>::max() ? std::numeric_limits<int64_t>::max() : static_cast<int64_t>(scalar_t_max);
128129
from = update_from<scalar_t>(from);
129130
TORCH_CHECK(from < to_inc, "random_ expects 'from' casted to dtype to be less than or equal to 'to_inc' casted to dtype, but got from=", from, " > to_inc=", to_inc);
130131
});

aten/src/ATen/native/Pow.cpp

Lines changed: 21 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -22,9 +22,10 @@ Tensor& pow_out(Tensor& result, const Tensor& base, Scalar exp) {
2222
TORCH_CHECK(!(isIntegralType(base.scalar_type(), true) &&
2323
exp.isIntegral(true) && exp.toLong() < 0),
2424
"Integers to negative integer powers are not allowed.");
25-
if (exp.toDouble() == 0.0) {
25+
// Avoid runtime error when typecasting
26+
if (!exp.isComplex() && (exp.toDouble() == 0.0)) {
2627
result.resize_as_(base).fill_(1);
27-
} else if (exp.toDouble() == 1.0) {
28+
} else if (!exp.isComplex() && (exp.toDouble() == 1.0)) {
2829
result.resize_as_(base).copy_(base);
2930
} else {
3031
auto iter = TensorIterator::unary_op(result, base,
@@ -52,12 +53,28 @@ Tensor& pow_(Tensor& base, Scalar alpha) {
5253
}
5354

5455
Tensor pow(const Tensor& base, const Tensor& exp) {
55-
Tensor result = at::empty({0}, base.options());
56+
// If the exponent is complex, the result needs to be complex
57+
// we can't rely on result_type because it will break current
58+
// handling
59+
// TODO: change it to use type promotion after #37098 is merged
60+
ScalarType dtype = (exp.is_complex() ? exp.scalar_type() : base.scalar_type());
61+
Tensor result = at::empty({0}, base.options().dtype(dtype));
5662
return native::pow_out(result, base, exp);
5763
}
5864

5965
Tensor pow(const Tensor& base, Scalar exp) {
60-
Tensor result = at::empty_like(base, MemoryFormat::Preserve);
66+
// If the exponent is complex, the result needs to be complex
67+
// we can't rely on result_type because it will break current
68+
// handling for other datatypes
69+
// TODO: change it to use type promotion after #37098 is merged
70+
ScalarType dtype = (exp.isComplex() ? exp.type() : base.scalar_type());
71+
Tensor result = at::empty({0}, base.options().dtype(dtype));
72+
if (exp.isComplex()) {
73+
// The type checking logic in unary_op TensorIterator does not allow
74+
// a float tensor to output to a complex tensor, but binary ops allow it
75+
// so we create a tensor for the exponent to avoid using this iterator until its fixed
76+
return native::pow_out(result, base, c10::scalar_to_tensor(exp, base.device()));
77+
}
6178
return native::pow_out(result, base, exp);
6279
}
6380

0 commit comments

Comments
 (0)