Skip to content

Commit 7082381

Browse files
committed
Update on "quantized hardsigmoid, take 2"
Summary: Adds a quantized implementation of hardsigmoid. The original PR was #34607 and had to be reverted for a test breakage; trying again. Test Plan: tests, benchmarks. Reviewers: Subscribers: Tasks: Tags: Differential Revision: [D20514212](https://our.internmc.facebook.com/intern/diff/D20514212) [ghstack-poisoned]
2 parents 55f379b + 5d92a6c commit 7082381

102 files changed

Lines changed: 1722 additions & 910 deletions

File tree

Some content is hidden

Large commits have some content hidden by default. Use the search box below for content that may be hidden.

.github/workflows/lint.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -105,7 +105,7 @@ jobs:
105105
run: |
106106
set -eux
107107
pip install flake8
108-
rm -rf .circleci
108+
rm -rf .circleci tools/clang_format_new.py
109109
flake8 --exit-zero > ${GITHUB_WORKSPACE}/flake8-output.txt
110110
cat ${GITHUB_WORKSPACE}/flake8-output.txt
111111
- name: Add annotations

.gitignore

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -252,3 +252,6 @@ TAGS
252252

253253
# clang-format storage location used by apply_clang_format.py
254254
.clang-format-bin
255+
256+
# clangd background index
257+
.clangd/

.jenkins/pytorch/test.sh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -182,7 +182,7 @@ test_aten() {
182182
}
183183

184184
test_torchvision() {
185-
pip_install --user git+https://github.com/pytorch/vision.git@44a5bae933655ed7ff798669a43452b833f9ce01
185+
pip_install --user git+https://github.com/pytorch/vision.git@43e94b39bcdda519c093ca11d99dfa2568aa7258
186186
}
187187

188188
test_libtorch() {
@@ -270,9 +270,9 @@ elif [[ "${BUILD_ENVIRONMENT}" == *libtorch* ]]; then
270270
# TODO: run some C++ tests
271271
echo "no-op at the moment"
272272
elif [[ "${BUILD_ENVIRONMENT}" == *-test1 || "${JOB_BASE_NAME}" == *-test1 ]]; then
273-
test_torchvision
274273
test_python_nn
275274
elif [[ "${BUILD_ENVIRONMENT}" == *-test2 || "${JOB_BASE_NAME}" == *-test2 ]]; then
275+
test_torchvision
276276
test_python_all_except_nn
277277
test_aten
278278
test_libtorch

android/pytorch_android/src/main/cpp/pytorch_jni_jit.cpp

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,12 @@ namespace {
2626
struct JITCallGuard {
2727
// AutoGrad is disabled for mobile by default.
2828
torch::autograd::AutoGradMode no_autograd_guard{false};
29+
// VariableType dispatch is not included in default mobile build. We need to set
30+
// this guard globally to avoid dispatch error (only for dynamic dispatch).
31+
// Thanks to the unification of Variable class and Tensor class it's no longer
32+
// required to toggle the NonVariableTypeMode per op - so it doesn't hurt to
33+
// always set NonVariableTypeMode for inference only use case.
34+
torch::AutoNonVariableTypeMode non_var_guard{true};
2935
// Disable graph optimizer to ensure list of unused ops are not changed for
3036
// custom mobile build.
3137
torch::jit::GraphOptimizerEnabledGuard no_optimizer_guard{false};
@@ -111,11 +117,11 @@ class PytorchJni : public facebook::jni::HybridClass<PytorchJni> {
111117
/* need_inputs */ false,
112118
/* sampled */ false);
113119
#endif
114-
JITCallGuard guard;
115120
}
116121

117122
PytorchJni(facebook::jni::alias_ref<jstring> modelPath) {
118123
preModuleLoadSetup();
124+
JITCallGuard guard;
119125
module_ = torch::jit::load(std::move(modelPath->toStdString()));
120126
module_.eval();
121127
}
@@ -147,6 +153,7 @@ class PytorchJni : public facebook::jni::HybridClass<PytorchJni> {
147153
"Could not get buffer for asset '%s'",
148154
assetName->toStdString().c_str());
149155
}
156+
JITCallGuard guard;
150157
module_ = torch::jit::load(torch::make_unique<MemoryReadAdapter>(
151158
assetBuffer, AAsset_getLength(asset)));
152159
AAsset_close(asset);

android/pytorch_android/src/main/cpp/pytorch_jni_lite.cpp

Lines changed: 18 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -12,10 +12,23 @@
1212

1313
#include "pytorch_jni_common.h"
1414

15-
using namespace pytorch_jni;
16-
1715
namespace pytorch_jni {
1816

17+
namespace {
18+
19+
struct LiteJITCallGuard {
20+
// VariableType dispatch is not included in default mobile build. We need to set
21+
// this guard globally to avoid dispatch error (only for dynamic dispatch).
22+
// Thanks to the unification of Variable class and Tensor class it's no longer
23+
// required to toggle the NonVariableTypeMode per op - so it doesn't hurt to
24+
// always set NonVariableTypeMode for inference only use case.
25+
// TODO: avoid having to set this guard for custom mobile build with mobile
26+
// interpreter.
27+
torch::AutoNonVariableTypeMode non_var_guard{true};
28+
};
29+
30+
} // namespace
31+
1932
class PytorchJni : public facebook::jni::HybridClass<PytorchJni> {
2033
private:
2134
friend HybridBase;
@@ -31,6 +44,7 @@ class PytorchJni : public facebook::jni::HybridClass<PytorchJni> {
3144
}
3245

3346
PytorchJni(facebook::jni::alias_ref<jstring> modelPath) {
47+
LiteJITCallGuard guard;
3448
module_ = torch::jit::_load_for_mobile(std::move(modelPath->toStdString()));
3549
}
3650

@@ -55,8 +69,7 @@ class PytorchJni : public facebook::jni::HybridClass<PytorchJni> {
5569
}
5670

5771
auto output = [&]() {
58-
torch::autograd::AutoGradMode guard(false);
59-
at::AutoNonVariableTypeMode non_var_type_mode(true);
72+
LiteJITCallGuard guard;
6073
return module_.forward(inputs);
6174
}();
6275
return JIValue::newJIValueFromAtIValue(output);
@@ -78,7 +91,7 @@ class PytorchJni : public facebook::jni::HybridClass<PytorchJni> {
7891
}
7992
if (auto method = module_.find_method(methodName)) {
8093
auto output = [&]() {
81-
at::AutoNonVariableTypeMode non_var_type_mode(true);
94+
LiteJITCallGuard guard;
8295
return module_.run_method(methodName, inputs);
8396
}();
8497
return JIValue::newJIValueFromAtIValue(output);

aten/src/ATen/core/List.h

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -139,6 +139,10 @@ class ListIterator final : public std::iterator<std::random_access_iterator_tag,
139139
ListElementReference<T, Iterator> operator*() const {
140140
return {iterator_};
141141
}
142+
143+
ListElementReference<T, Iterator> operator[](typename List<T>::size_type offset) const {
144+
return {iterator_ + offset};
145+
}
142146

143147
private:
144148
explicit ListIterator(Iterator iterator): iterator_(std::move(iterator)) {}

aten/src/ATen/native/BinaryOps.cpp

Lines changed: 48 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -59,13 +59,27 @@ Tensor& add_(Tensor& self, const Tensor& other, Scalar alpha) {
5959
}
6060

6161
Tensor& div_out(Tensor& result, const Tensor& self, const Tensor& other) {
62+
if (isIntegralType(result.scalar_type(), /*includeBool=*/ true)) {
63+
TORCH_WARN_ONCE(
64+
"Integer division of tensors using div or / is deprecated, ",
65+
"and in a future release div will perform true division as in Python 3. ",
66+
"Use true_divide or floor_divide (// in Python) instead.");
67+
}
68+
6269
auto iter = TensorIterator::binary_op(result, self, other,
6370
/*check_mem_overlap=*/true);
6471
div_stub(iter.device_type(), iter);
6572
return result;
6673
}
6774

6875
Tensor div(const Tensor& self, const Tensor& other) {
76+
if (isIntegralType(self.scalar_type(), /*includeBool=*/ true)
77+
&& isIntegralType(other.scalar_type(), /*includeBool=*/ true)) {
78+
TORCH_WARN_ONCE(
79+
"Integer division of tensors using div or / is deprecated, ",
80+
"and in a future release div will perform true division as in Python 3. ",
81+
"Use true_divide or floor_divide (// in Python) instead.");
82+
}
6983
Tensor result;
7084
auto iter = TensorIterator::binary_op(result, self, other);
7185
div_stub(iter.device_type(), iter);
@@ -94,13 +108,6 @@ Tensor& remainder_(Tensor& self, const Tensor& other) {
94108
return native::remainder_out(self, self, other);
95109
}
96110

97-
Tensor truncate(const Tensor& tensor) {
98-
if (tensor.is_floating_point()) {
99-
return tensor.trunc();
100-
}
101-
return tensor;
102-
}
103-
104111
Tensor& true_divide_out(Tensor& result, const Tensor& self, const Tensor& divisor) {
105112
TORCH_CHECK(!isIntegralType(result.scalar_type(), /*includeBool=*/ true),
106113
"True division requires a floating output type, but got ",
@@ -131,14 +138,34 @@ Tensor true_divide(const Tensor& self, const Tensor& divisor) {
131138
return iter.output();
132139
}
133140

134-
Tensor floor_divide(const Tensor& input, const Tensor& other) {
135-
Tensor out = input / other;
136-
return truncate(out);
141+
Tensor& floor_divide_out(Tensor& result, const Tensor& self, const Tensor& other) {
142+
auto iter = TensorIterator::binary_op(result, self, other,
143+
/*check_mem_overlap=*/true);
144+
div_stub(iter.device_type(), iter);
145+
146+
if (result.is_floating_point()) {
147+
result.trunc_();
148+
}
149+
150+
return result;
151+
}
152+
153+
Tensor floor_divide(const Tensor& self, const Tensor& other) {
154+
Tensor result;
155+
auto iter = TensorIterator::binary_op(result, self, other);
156+
157+
div_stub(iter.device_type(), iter);
158+
159+
auto out = iter.output();
160+
if (out.is_floating_point()) {
161+
out.trunc_();
162+
}
163+
164+
return out;
137165
}
138166

139-
Tensor floor_divide(const Tensor& input, Scalar other) {
140-
Tensor out = input / other;
141-
return truncate(out);
167+
Tensor& floor_divide_(Tensor& self, const Tensor& other) {
168+
return native::floor_divide_out(self, self, other);
142169
}
143170

144171
Tensor& mul_out(Tensor& result, const Tensor& self, const Tensor& other) {
@@ -661,6 +688,14 @@ Tensor min(const Tensor& self, const Tensor& other) {
661688

662689
Tensor& min_(Tensor& self, const Tensor& other) { return at::min_out(self, self, other); }
663690

691+
Tensor floor_divide(const Tensor& self, Scalar other) {
692+
return at::floor_divide(self, wrapped_scalar_tensor(other));
693+
}
694+
695+
Tensor& floor_divide_(Tensor& self, Scalar other) {
696+
return at::floor_divide_out(self, self, wrapped_scalar_tensor(other));
697+
}
698+
664699
Tensor& fmod_out(Tensor & result, const Tensor& self, const Tensor& other) {
665700
auto iter = TensorIterator::binary_op(result, self, other,
666701
/*check_mem_overlap=*/true);

aten/src/ATen/native/PointwiseOps.cpp

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -69,6 +69,17 @@ Tensor& addcdiv_out(
6969
const Tensor& tensor1,
7070
const Tensor& tensor2,
7171
Scalar value) {
72+
if (isIntegralType(tensor1.scalar_type(), /*includeBool=*/ true)
73+
&& isIntegralType(tensor2.scalar_type(), /*includeBool=*/ true)) {
74+
TORCH_WARN_ONCE(
75+
"Integer division with addcdiv is deprecated, and in a future ",
76+
"release addcdiv will perform a true division of tensor1 and tensor2. ",
77+
"The current addcdiv behavior can be replicated using floor_divide ",
78+
"for integral inputs (self + value * tensor1 // tensor2) and ",
79+
"division for float inputs (self + value * tensor1 / tensor2). ",
80+
"The new addcdiv behavior can be implemented with true_divide ",
81+
"(self + value * torch.true_divide(tensor1, tensor2).");
82+
}
7283
checkBackend("addcdiv_cpu", result, self.options().backend());
7384
auto iter = at::TensorIterator();
7485
iter.set_check_mem_overlap(true);

aten/src/ATen/native/TensorFactories.cpp

Lines changed: 48 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -134,6 +134,7 @@ Tensor empty_cpu(IntArrayRef size, const TensorOptions& options_, c10::optional<
134134

135135
auto memory_format = options.memory_format_opt().value_or(MemoryFormat::Contiguous);
136136
tensor.unsafeGetTensorImpl()->empty_tensor_restride(memory_format);
137+
137138
return tensor;
138139
}
139140

@@ -342,18 +343,47 @@ Tensor& eye_out_cpu(Tensor& result, int64_t n, int64_t m) {
342343

343344
// ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ full ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
344345

345-
Tensor full(IntArrayRef size, Scalar fill_value, const TensorOptions& options) {
346-
if (options.layout() == kSparse) {
347-
AT_ERROR("full(...) is not implemented for sparse layout");
346+
namespace {
347+
348+
// Performs dtype inference for full
349+
TensorOptions infer_full_options(
350+
Scalar fill_value,
351+
const TensorOptions& options) {
352+
353+
if (!options.has_dtype()) {
354+
if (fill_value.isIntegral(true)) {
355+
TORCH_WARN_ONCE(
356+
"Deprecation warning: In a future PyTorch release torch.full ",
357+
"will no longer return tensors of floating dtype by default. ",
358+
"Instead, a bool fill_value will return a tensor of torch.bool dtype, ",
359+
"and an integral fill_value will return a tensor of torch.long dtype. ",
360+
"Set the optional `dtype` or `out` arguments to suppress this warning."
361+
);
362+
} else if (fill_value.isComplex()) {
363+
auto scalar_type = (get_default_dtype() == ScalarType::Double) ?
364+
ScalarType::ComplexDouble :
365+
ScalarType::ComplexFloat;
366+
return options.dtype(scalar_type);
367+
}
348368
}
349-
auto result = at::empty(size, options);
369+
370+
return options;
371+
}
372+
373+
} // anonymous namespace
374+
375+
Tensor full(IntArrayRef size, Scalar fill_value, const TensorOptions& options) {
376+
TORCH_CHECK(options.layout() != kSparse,
377+
"full(...) is not implemented for sparse layout");
378+
379+
auto result = at::empty(size, infer_full_options(fill_value, options));
350380
return result.fill_(fill_value);
351381
}
352382

353383
Tensor& full_out(Tensor& result, IntArrayRef size, Scalar fill_value) {
354-
if (result.is_sparse()) {
355-
AT_ERROR("full(...) is not implemented for sparse layout");
356-
}
384+
TORCH_CHECK(!result.is_sparse(),
385+
"full(...) is not implemented for sparse layout");
386+
357387
result.resize_(size);
358388
return result.fill_(fill_value);
359389
}
@@ -404,19 +434,19 @@ Tensor logspace(
404434
// ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ones ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
405435

406436
Tensor ones(IntArrayRef size, const TensorOptions& options) {
407-
return native::full(size, /*fill_value=*/1, options);
437+
return native::full(size, /*fill_value=*/1., options);
408438
}
409439

410440
Tensor& ones_out(Tensor& result, IntArrayRef size) {
411-
return native::full_out(result, size, /*fill_value=*/1);
441+
return native::full_out(result, size, /*fill_value=*/1.);
412442
}
413443

414444
Tensor ones_like(
415445
const Tensor& self,
416446
const TensorOptions& options,
417447
c10::optional<c10::MemoryFormat> optional_memory_format) {
418448
auto result = at::empty_like(self, options, optional_memory_format);
419-
return result.fill_(1);
449+
return result.fill_(1.);
420450
}
421451

422452
// ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ scalar_tensor ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
@@ -746,7 +776,7 @@ Tensor zeros(IntArrayRef size, const TensorOptions& options) {
746776

747777
Tensor& zeros_out(Tensor& result, IntArrayRef size) {
748778
if (result.is_sparse()) {
749-
result.sparse_resize_and_clear_(size, size.size(), 0);
779+
result.sparse_resize_and_clear_(size, size.size(), 0.);
750780
return result;
751781
} else {
752782
result.resize_(size);
@@ -960,22 +990,26 @@ Tensor full(
960990
Scalar fill_value,
961991
optional<DimnameList> names,
962992
const TensorOptions& options) {
963-
auto result = at::empty(size, names, options);
993+
994+
TORCH_CHECK(options.layout() != kSparse,
995+
"full(...) is not implemented for sparse layout");
996+
997+
auto result = at::empty(size, names, infer_full_options(fill_value, options));
964998
return result.fill_(fill_value);
965999
}
9661000

9671001
Tensor ones(
9681002
IntArrayRef size,
9691003
optional<DimnameList> names,
9701004
const TensorOptions& options) {
971-
return native::full(size, /*fill_value=*/1, names, options);
1005+
return native::full(size, /*fill_value=*/1., names, options);
9721006
}
9731007

9741008
Tensor zeros(
9751009
IntArrayRef size,
9761010
optional<DimnameList> names,
9771011
const TensorOptions& options) {
978-
return native::full(size, /*fill_value=*/0, names, options);
1012+
return native::full(size, /*fill_value=*/0., names, options);
9791013
}
9801014

9811015
Tensor randn(

0 commit comments

Comments (0)