Skip to content

Commit 4ed790d

Browse files
Krovatkin authored and facebook-github-bot committed
Adding symbolic sizes, contiguity, stride indices (#36101)
Summary: Pull Request resolved: #36101 Reviewed By: jamesr66a Differential Revision: D20908711 Pulled By: Krovatkin fbshipit-source-id: f90ce74acffeb645d7d906d07e293164d65ed7e6
1 parent 9e32a1f commit 4ed790d

15 files changed

Lines changed: 503 additions & 250 deletions

File tree

aten/src/ATen/core/jit_type.h

Lines changed: 187 additions & 118 deletions
Large diffs are not rendered by default.

aten/src/ATen/core/type.cpp

Lines changed: 265 additions & 76 deletions
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,7 @@ std::ostream& operator<<(std::ostream & out, const Type & t) {
3939
}
4040
out << ")";
4141
}
42+
4243
if (value->undefined() && *value->undefined()) {
4344
out << "[Undefined]";
4445
}
@@ -81,55 +82,9 @@ AnyTypePtr AnyType::get() {
8182
return value;
8283
}
8384

84-
template <typename T>
85-
static bool compatible_optional(c10::optional<T> e, T a) {
86-
return !e.has_value() || e.value() == a;
87-
}
88-
89-
static bool compatible_varying_shape(const VaryingShape& e, at::IntArrayRef a) {
90-
if (!e.size().has_value()) {
91-
return true;
92-
}
93-
94-
if (e.size().value() != a.size()) {
95-
return false;
96-
}
97-
98-
auto ndim = a.size();
99-
for (size_t i = 0; i < ndim; i++) {
100-
if (!compatible_optional(e[i], a[i])) {
101-
return false;
102-
}
103-
}
104-
return true;
105-
}
106-
107-
bool TensorType::isCompatibleWithInCurrentExecutionContext(
108-
at::Tensor& t) const {
109-
// any updates to `isSubtypeOf`, TensorType c-tor or
110-
// `isCompatibleWithInCurrentExecutionContext` need to maintain the following
111-
// `TensorType::create(actual_tensor)->isSubtypeOf(expected_type)
112-
// == expected_type->isCompatibleWithInCurrentExecutionContext(t)`
113-
if (!t.defined()) {
114-
return compatible_optional(undefined(), !t.defined());
115-
}
116-
117-
return compatible_varying_shape(sizes(), t.sizes()) &&
118-
(t.is_sparse() || t.is_mkldnn() ||
119-
compatible_varying_shape(strides(), t.strides())) &&
120-
compatible_optional(
121-
requiresGrad(), t.requires_grad() && at::GradMode::is_enabled()) &&
122-
compatible_optional(scalarType(), t.scalar_type()) &&
123-
compatible_optional(device(), t.device());
124-
}
125-
12685
TensorTypePtr TensorType::get() {
  // Singleton for the most general tensor type: unknown dtype, device,
  // sizes, strides, and undefinedness.
  static auto value = TensorType::create(
      {},
      {},
      VaryingShape<ShapeSymbol>{},
      VaryingShape<Stride>{},
      {});
  return value;
}
13590

@@ -527,51 +482,111 @@ std::string TensorType::str() const {
527482
return "Tensor";
528483
}
529484

530-
template <typename T>
VaryingShape<T> VaryingShape<T>::merge(const VaryingShape<T>& other) const {
  // If either rank is unknown, or the ranks disagree, the merge carries no
  // shape information at all.
  if (!dims_ || !other.dims_ || dims_->size() != other.dims_->size()) {
    return VaryingShape<T>();
  }

  const size_t rank = dims_->size();
  ListOfOptionalElements merged;
  for (size_t dim = 0; dim < rank; ++dim) {
    merged.push_back(merge_primitive((*dims_)[dim], (*other.dims_)[dim]));
  }
  return VaryingShape<T>(std::move(merged));
}
540496

541-
TensorTypePtr TensorType::merge(TensorTypePtr other) const {
497+
VaryingShape<int64_t> TensorType::sizes() const {
  // Unknown rank maps to a fully unknown shape.
  if (!sizes_.size().has_value()) {
    return VaryingShape<int64_t>();
  }
  // Project symbolic dimensions onto concrete sizes; non-static (symbolic)
  // dimensions become unknown.
  return VaryingShape<int64_t>(fmap(
      *sizes_.sizes(),
      [](c10::optional<ShapeSymbol> dim) -> c10::optional<int64_t> {
        if (dim.has_value() && dim->is_static()) {
          return dim->static_size();
        }
        return c10::nullopt;
      }));
}
509+
510+
TensorTypePtr TensorType::merge(TensorTypePtr other, bool merge_sizes) const {
  // Merge each property pairwise; a disagreement collapses that property to
  // "unknown" (see merge_primitive / VaryingShape::merge).
  auto merged_scalar_type = merge_primitive(scalarType(), other->scalarType());
  auto merged_device = merge_primitive(device(), other->device());
  auto merged_sprops =
      stride_properties().merge(other->stride_properties());
  auto merged_grad = merge_primitive(requiresGrad(), other->requiresGrad());
  auto merged_undefined = merge_primitive(undefined(), other->undefined());
  // Callers may opt out of merging sizes and keep this type's symbolic sizes.
  auto merged_sizes = merge_sizes
      ? symbolic_sizes().merge(other->symbolic_sizes())
      : symbolic_sizes();
  return TensorType::create(
      merged_scalar_type,
      merged_device,
      merged_sizes,
      merged_sprops,
      merged_grad,
      merged_undefined);
}
525+
526+
bool TensorType::operator==(const c10::Type& rhs) const {
  // Only another TensorType can compare equal.
  if (rhs.kind() != kind()) {
    return false;
  }
  auto other = rhs.expect<TensorType>();

  return scalar_type_ == other->scalarType() &&
      sizes() == other->sizes() &&
      stride_properties() == other->stride_properties() &&
      device() == other->device() &&
      requiresGrad() == other->requiresGrad() &&
      undefined() == other->undefined();
}
550537

551-
std::ostream& operator<<(std::ostream & out, const VaryingShape & vs) {
538+
template <typename T>
539+
std::ostream& operator<<(std::ostream& out, const VaryingShape<T>& vs) {
540+
out << "(";
541+
if (!vs.size()) {
542+
out << "*)";
543+
return out;
544+
}
552545

553-
out << "(";
554-
if (!vs.size()) {
555-
out << "*)";
556-
return out;
546+
for (size_t i = 0; i < vs.size(); i++) {
547+
if (i > 0) {
548+
out << ", ";
557549
}
558-
559-
for (size_t i = 0; i < vs.size(); i++)
560-
{
561-
if (i > 0) {
562-
out << ", ";
563-
}
564-
if (vs[i].has_value())
565-
{
566-
out << vs[i].value();
567-
}
568-
else
569-
{
570-
out << "*";
571-
}
550+
if (vs[i].has_value()) {
551+
out << vs[i].value();
552+
} else {
553+
out << "*";
572554
}
573-
out << ")";
574-
return out;
555+
}
556+
out << ")";
557+
return out;
558+
}
559+
560+
template std::ostream& operator<<(
561+
std::ostream& out,
562+
const VaryingShape<int64_t>& vs);
563+
template std::ostream& operator<<(
564+
std::ostream& out,
565+
const VaryingShape<ShapeSymbol>& vs);
566+
template std::ostream& operator<<(
567+
std::ostream& out,
568+
const VaryingShape<Stride>& vs);
569+
570+
std::ostream& operator<<(std::ostream& os, const ShapeSymbol& s) {
571+
os << "SS(" << s.value_ << ')';
572+
return os;
573+
}
574+
575+
std::ostream& operator<<(std::ostream& os, const Stride& s) {
576+
os << "{";
577+
if (s.stride_index_.has_value()) {
578+
os << *s.stride_index_;
579+
} else {
580+
os << "*";
581+
}
582+
os << ":";
583+
if (s.stride_.has_value()) {
584+
os << *s.stride_;
585+
} else {
586+
os << "*";
587+
}
588+
os << '}';
589+
return os;
575590
}
576591

577592
TupleTypePtr TupleType::createNamed(
@@ -708,6 +723,180 @@ std::string TupleType::python_str_impl(TypePrinter printer) const {
708723
return ss.str();
709724
}
710725

726+
static std::vector<bool> findContiguous(
727+
const at::IntArrayRef& sizes,
728+
const at::IntArrayRef& strides) {
729+
AT_ASSERT(sizes.size() == strides.size());
730+
std::vector<bool> cont(sizes.size());
731+
for (size_t i = 0; i < sizes.size(); ++i) {
732+
const auto expected_stride =
733+
(i + 1 < sizes.size()) ? sizes[i + 1] * strides[i + 1] : 1;
734+
cont[i] = (strides[i] == expected_stride);
735+
}
736+
return cont;
737+
}
738+
739+
VaryingShape<int64_t> TensorType::strides() const {
  if (!strides_.size().has_value()) {
    return VaryingShape<int64_t>();
  }
  const size_t ndim = *strides_.size();
  // Stride properties are kept in increasing-stride order; scatter each
  // known stride back to its dimension via stride_index_.
  std::vector<c10::optional<int64_t>> result(ndim);
  for (size_t i = 0; i < ndim; ++i) {
    const auto& prop = strides_[i];
    if (!prop.has_value()) {
      continue;
    }
    if (prop->stride_index_.has_value() && prop->stride_.has_value()) {
      result[*prop->stride_index_] = *prop->stride_;
    }
  }
  return VaryingShape<int64_t>(result);
}
755+
756+
VaryingShape<Stride> TensorType::computeStrideProps(
757+
at::IntArrayRef sizes,
758+
at::IntArrayRef strides) {
759+
std::vector<size_t> stride_indices(sizes.size());
760+
std::iota(stride_indices.begin(), stride_indices.end(), 0);
761+
762+
std::sort(
763+
stride_indices.begin(),
764+
stride_indices.end(),
765+
[&strides](const int& a, const int& b) {
766+
// break ties in case of unsqueezed dims
767+
// i.e. (1, 1, 5)
768+
if (strides[a] == strides[b]) {
769+
return a > b;
770+
}
771+
return strides[a] < strides[b];
772+
});
773+
774+
std::vector<Stride> stride_properties;
775+
for (size_t i = 0; i < stride_indices.size(); i++) {
776+
Stride s{stride_indices[i], false, strides[stride_indices[i]]};
777+
// innermost stride expected to be 1
778+
// TODO: turn contiguous_ into an enum CONTIGUOUS, NONCONTIGUOUS,
779+
// BROADCASTED
780+
if (i == 0) {
781+
s.contiguous_ = strides[stride_indices[i]] == 1;
782+
} else {
783+
s.contiguous_ = strides[stride_indices[i]] == 1 ||
784+
(strides[stride_indices[i]] != 0 &&
785+
strides[stride_indices[i]] ==
786+
strides[stride_indices[i - 1]] * sizes[stride_indices[i - 1]]);
787+
}
788+
stride_properties.push_back(s);
789+
}
790+
791+
return VaryingShape<Stride>{stride_properties};
792+
}
793+
794+
std::atomic<size_t> ShapeSymbol::num_symbols{1};
795+
796+
template struct VaryingShape<c10::ShapeSymbol>;
797+
template struct VaryingShape<bool>;
798+
template struct VaryingShape<size_t>;
799+
template struct VaryingShape<int64_t>;
800+
801+
// Private constructor; use one of the TensorType::create overloads.
TensorType::TensorType(
    c10::optional<at::ScalarType> scalar_type,
    c10::optional<Device> device,
    const VaryingShape<ShapeSymbol>& sizes,
    const VaryingShape<Stride>& strides,
    c10::optional<bool> requires_grad,
    c10::optional<bool> undefined)
    : Type(TypeKind::TensorType),
      scalar_type_(scalar_type),
      device_(device),
      sizes_(sizes),
      strides_(strides),
      requires_grad_(requires_grad),
      undefined_(undefined) {}
815+
816+
TensorTypePtr TensorType::create(const at::Tensor& t) {
  // Only dense (non-mkldnn, non-sparse) tensors get concrete sizes and
  // strides recorded; everything else falls through to an unknown shape.
  // Fix: the original declared `VaryingShape<bool> contiguity` and
  // `VaryingShape<size_t> stride_indices` locals that were never used, and
  // hoisted sizes/strides out of the branch that needs them — removed.
  if (!t.is_mkldnn() && !t.is_sparse()) {
    VaryingShape<int64_t> sizes{t.sizes().vec()};
    VaryingShape<int64_t> strides{t.strides().vec()};
    return TensorType::create(
        t.scalar_type(), t.device(), sizes, strides, t.requires_grad(), false);
  }

  return TensorType::create(
      t.scalar_type(),
      t.device(),
      VaryingShape<ShapeSymbol>{},
      VaryingShape<Stride>{},
      t.requires_grad(),
      false);
}
836+
837+
TensorTypePtr TensorType::create(
    c10::optional<at::ScalarType> scalar_type,
    c10::optional<Device> device,
    const VaryingShape<int64_t>& sizes,
    const VaryingShape<int64_t>& strides,
    c10::optional<bool> requires_grad,
    c10::optional<bool> undefined) {
  // Concrete sizes are required here; strides are optional but, when
  // present, must match the rank of sizes.
  TORCH_INTERNAL_ASSERT(sizes.concrete_sizes().has_value());
  TORCH_INTERNAL_ASSERT(
      !strides.concrete_sizes().has_value() ||
      sizes.concrete_sizes()->size() == strides.concrete_sizes()->size());

  auto stride_props = strides.concrete_sizes().has_value()
      ? computeStrideProps(*sizes.concrete_sizes(), *strides.concrete_sizes())
      : VaryingShape<Stride>();

  return TensorType::create(
      scalar_type,
      device,
      VaryingShape<ShapeSymbol>::fromStaticShape(*sizes.concrete_sizes()),
      stride_props,
      requires_grad,
      undefined);
}
857+
858+
// Base overload: every other create() overload funnels into this one.
TensorTypePtr TensorType::create(
    c10::optional<at::ScalarType> scalar_type,
    c10::optional<Device> device,
    const VaryingShape<ShapeSymbol>& sizes,
    const VaryingShape<Stride>& strides,
    c10::optional<bool> requires_grad,
    c10::optional<bool> undefined) {
  return TensorTypePtr(new TensorType(
      scalar_type, device, sizes, strides, requires_grad, undefined));
}
868+
869+
TensorTypePtr TensorType::create(
    c10::optional<at::ScalarType> scalar_type,
    c10::optional<Device> device,
    c10::optional<size_t> dim,
    c10::optional<bool> requires_grad) {
  // Rank-only type: `dim` dimensions, each with unknown size and stride.
  return TensorType::create(
      scalar_type,
      device,
      VaryingShape<ShapeSymbol>(dim),
      VaryingShape<Stride>(dim),
      requires_grad);
}
881+
882+
TensorTypePtr TensorType::createContiguous(
    at::ScalarType scalar_type,
    at::Device device,
    at::IntArrayRef sizes) {
  // Derive dense, row-major strides from the sizes.
  auto contiguous_strides = contiguousStridesOf(sizes);
  TORCH_INTERNAL_ASSERT(contiguous_strides.size() == sizes.size());
  return create(
      scalar_type,
      device,
      VaryingShape<int64_t>(sizes),
      VaryingShape<int64_t>(contiguous_strides),
      c10::nullopt);
}
895+
896+
// Accessor for the stored (possibly symbolic) sizes.
const VaryingShape<ShapeSymbol>& TensorType::symbolic_sizes() const {
  return sizes_;
}
899+
711900
bool TensorType::isSubtypeOfExt(const TypePtr rhs, std::ostream* why_not) const {
712901
if (auto rhs_p = rhs->cast<TensorType>()) {
713902
// if we have the same pointer, avoid computing the merge

0 commit comments

Comments
 (0)