
Commit ab78449

Roy Li authored and facebook-github-bot committed

Add ScalarType argument to Type::options() (pytorch#19270)
Summary: Pull Request resolved: pytorch#19270
ghimport-source-id: a5ade61
Differential Revision: D14938707
Pulled By: li-roy
fbshipit-source-id: 018fb3f01706531a06515d6d861e5683a455a705
1 parent a044ba1 commit ab78449

Showing 18 changed files with 76 additions and 73 deletions.

aten/src/ATen/Context.h (+5)

@@ -176,6 +176,11 @@ CAFFE2_API TypeExtendedInterface& getType(const Tensor&);
 
 CAFFE2_API Allocator* getCPUAllocator();
 
+static inline DeprecatedTypeProperties& getNonVariableDeprecatedTypeProperties(Backend p, ScalarType s) {
+  return globalDeprecatedTypePropertiesRegistry().getDeprecatedTypeProperties(
+      p, s, /*is_variable*/false);
+}
+
 static inline DeprecatedTypeProperties& CPU(ScalarType s) {
   return globalDeprecatedTypePropertiesRegistry().getDeprecatedTypeProperties(
       Backend::CPU, s, /*is_variable*/false);
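
For orientation, a minimal usage sketch of the helper added above, assuming only the ATen headers; the updated TensorOptions tests further down exercise the same pattern:

    #include <ATen/ATen.h>

    // Sketch: look up the non-variable DeprecatedTypeProperties for a
    // backend/dtype pair, then build TensorOptions from it.
    at::DeprecatedTypeProperties& props =
        at::getNonVariableDeprecatedTypeProperties(at::Backend::SparseCPU, at::kByte);
    at::TensorOptions opts = at::TensorOptions(props);  // CPU device, Byte dtype, sparse layout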

aten/src/ATen/core/Type.h (+5 -10)

@@ -176,30 +176,25 @@ struct CAFFE2_API Type {
     return this != &other;
   }
 
-  /// Constructs the `TensorOptions` from a type and a `device_index`.
-  TensorOptions options(int16_t device_index = -1) const {
-    return TensorOptions().dtype(typeMeta())
+  TensorOptions options(ScalarType s, int16_t device_index = -1) const {
+    return TensorOptions().dtype(s)
         .device(device_type(), device_index)
         .layout(layout())
         .is_variable(is_variable());
   }
 
   /// Constructs the `TensorOptions` from a type and a Device. Asserts that
   /// the device type matches the device type of the type.
-  TensorOptions options(c10::optional<Device> device_opt) const {
+  TensorOptions options(ScalarType s, c10::optional<Device> device_opt) const {
     if (!device_opt.has_value()) {
-      return options(-1);
+      return options(s, -1);
     } else {
       Device device = device_opt.value();
       AT_ASSERT(device.type() == device_type());
-      return options(device.index());
+      return options(s, device.index());
     }
   }
 
-  operator TensorOptions() const {
-    return options();
-  }
-
   // example
   // virtual Tensor * add(Tensor & a, Tensor & b) = 0;
   virtual Tensor abs(const Tensor & self) const = 0;
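
For illustration, a hedged sketch of how a call site adapts to this signature change (the tensor variable here is hypothetical; dispatch_type() and scalar_type() are the Tensor accessors used by other files in this commit):

    // Before: the dtype came implicitly from the Type's typeMeta(), and Type
    // also converted implicitly to TensorOptions.
    //   auto opts = tensor.dispatch_type().options();
    // After: the caller passes the ScalarType explicitly; the implicit
    // operator TensorOptions() is removed.
    auto opts = tensor.dispatch_type().options(tensor.scalar_type());
    auto zeros = at::zeros({2, 3}, opts);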

aten/src/ATen/function_wrapper.py (+2 -1)

@@ -1604,7 +1604,8 @@ def emit_body(env, option, scalar_type_cases):
         # e.g. x.sum(0) and x.sum() return the same type. We explicitly cast to the
         # ScalarType before constructing the scalar_tensor to avoid overflow checking.
         elif ret['type'] == 'accreal' or ret['type'] == 'real':
-            return_scalar = 'return at::scalar_tensor(convert<${ScalarType}>(${call}), options());'
+            return_scalar = ('return at::scalar_tensor(convert<${ScalarType}>(${call}), '
+                             'options(ScalarType::${ScalarName}));')
             case_body.append(CodeTemplate(return_scalar).substitute(case_env, call=call))
         else:
             # we using int64_t for long in the API, so correct it here...
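
A hedged illustration of what the generated return statement might look like once the template is substituted, shown here for a Float case (the_call stands in for the elided backend call):

    // Previously generated: dtype taken implicitly from the Type's options().
    //   return at::scalar_tensor(convert<float>(the_call), options());
    // Now generated: the ScalarType is spelled out explicitly.
    return at::scalar_tensor(convert<float>(the_call), options(ScalarType::Float));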

aten/src/ATen/templates/Type.h (+5 -10)

@@ -119,30 +119,25 @@ struct CAFFE2_API Type {
     return this != &other;
   }
 
-  /// Constructs the `TensorOptions` from a type and a `device_index`.
-  TensorOptions options(int16_t device_index = -1) const {
-    return TensorOptions().dtype(typeMeta())
+  TensorOptions options(ScalarType s, int16_t device_index = -1) const {
+    return TensorOptions().dtype(s)
         .device(device_type(), device_index)
         .layout(layout())
         .is_variable(is_variable());
   }
 
   /// Constructs the `TensorOptions` from a type and a Device. Asserts that
   /// the device type matches the device type of the type.
-  TensorOptions options(c10::optional<Device> device_opt) const {
+  TensorOptions options(ScalarType s, c10::optional<Device> device_opt) const {
     if (!device_opt.has_value()) {
-      return options(-1);
+      return options(s, -1);
     } else {
       Device device = device_opt.value();
       AT_ASSERT(device.type() == device_type());
-      return options(device.index());
+      return options(s, device.index());
     }
   }
 
-  operator TensorOptions() const {
-    return options();
-  }
-
   // example
   // virtual Tensor * add(Tensor & a, Tensor & b) = 0;
   ${pure_virtual_type_method_declarations}

test/cpp/api/tensor_options.cpp (+3 -3)

@@ -66,18 +66,18 @@ TEST(TensorOptionsTest, ConstructsWellFromCPUTypes) {
   options = TensorOptions(kInt);
   REQUIRE_OPTIONS(kCPU, -1, kInt, kStrided);
 
-  options = TensorOptions(getNonVariableType(Backend::SparseCPU, kFloat));
+  options = TensorOptions(getNonVariableDeprecatedTypeProperties(Backend::SparseCPU, kFloat));
   REQUIRE_OPTIONS(kCPU, -1, kFloat, kSparse);
 
-  options = TensorOptions(getNonVariableType(Backend::SparseCPU, kByte));
+  options = TensorOptions(getNonVariableDeprecatedTypeProperties(Backend::SparseCPU, kByte));
   REQUIRE_OPTIONS(kCPU, -1, kByte, kSparse);
 }
 
 TEST(TensorOptionsTest, ConstructsWellFromCPUTensors) {
   auto options = empty(5, kDouble).options();
   REQUIRE_OPTIONS(kCPU, -1, kDouble, kStrided);
 
-  options = empty(5, getNonVariableType(Backend::SparseCPU, kByte)).options();
+  options = empty(5, getNonVariableDeprecatedTypeProperties(Backend::SparseCPU, kByte)).options();
   REQUIRE_OPTIONS(kCPU, -1, kByte, kSparse);
 }

test/cpp/api/tensor_options_cuda.cpp (+4 -4)

@@ -42,25 +42,25 @@ TEST(TensorOptionsTest, ConstructsWellFromCUDATypes_CUDA) {
   options = CUDA(kInt).options();
   REQUIRE_OPTIONS(kCUDA, -1, kInt, kStrided);
 
-  options = getNonVariableType(Backend::SparseCUDA, kFloat).options();
+  options = getNonVariableDeprecatedTypeProperties(Backend::SparseCUDA, kFloat).options();
   REQUIRE_OPTIONS(kCUDA, -1, kFloat, kSparse);
 
-  options = getNonVariableType(Backend::SparseCUDA, kByte).options();
+  options = getNonVariableDeprecatedTypeProperties(Backend::SparseCUDA, kByte).options();
   REQUIRE_OPTIONS(kCUDA, -1, kByte, kSparse);
 
   options = CUDA(kFloat).options(/*device=*/5);
   REQUIRE_OPTIONS(kCUDA, 5, kFloat, kStrided);
 
   options =
-      getNonVariableType(Backend::SparseCUDA, kFloat).options(/*device=*/5);
+      getNonVariableDeprecatedTypeProperties(Backend::SparseCUDA, kFloat).options(/*device=*/5);
   REQUIRE_OPTIONS(kCUDA, 5, kFloat, kSparse);
 }
 
 TEST(TensorOptionsTest, ConstructsWellFromCUDATensors_MultiCUDA) {
   auto options = empty(5, device(kCUDA).dtype(kDouble)).options();
   REQUIRE_OPTIONS(kCUDA, 0, kDouble, kStrided);
 
-  options = empty(5, getNonVariableType(Backend::SparseCUDA, kByte)).options();
+  options = empty(5, getNonVariableDeprecatedTypeProperties(Backend::SparseCUDA, kByte)).options();
   REQUIRE_OPTIONS(kCUDA, 0, kByte, kSparse);
 
   if (torch::cuda::device_count() > 1) {

tools/autograd/templates/Functions.h (+2 -2)

@@ -35,13 +35,13 @@ struct TypeAndSize {
   /* implicit */
   TypeAndSize(const Tensor & t)
     : sizes(t.sizes().vec())
-    , type(&t.dispatch_type()) {}
+    , type(&t.type()) {}
 
   Tensor zeros() { return at::zeros(sizes, *type); }
 
  private:
   std::vector<int64_t> sizes;
-  Type* type;
+  at::DeprecatedTypeProperties* type;
 };
 
 ${autograd_function_declarations}
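
A hedged note on the swap from Type* to at::DeprecatedTypeProperties*: per the registry lookup added in Context.h above, a DeprecatedTypeProperties is keyed by backend, scalar type, and variable-ness, so Tensor::type() still carries everything the unchanged at::zeros(sizes, *type) call needs. Illustrative sketch (the tensor t is hypothetical):

    at::Tensor t = at::ones({4}, at::kFloat);
    at::DeprecatedTypeProperties& props = t.type();     // backend + scalar type + is_variable
    at::TensorOptions opts = at::TensorOptions(props);  // same constructor the tests above use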

torch/csrc/autograd/engine.cpp (+2 -2)

@@ -334,7 +334,7 @@ static variable_list call_post_hooks(Function& fn, variable_list outputs, const
   return outputs;
 }
 
-static bool is_compatible_type(const at::Type& expected, const at::Type& actual) {
+static bool is_compatible_type(const at::DeprecatedTypeProperties& expected, const at::DeprecatedTypeProperties& actual) {
   // Types are compatible if they exactly match or if the gradient is a sparse
   // version of the expected type.
   return expected == actual || (actual.is_sparse() &&
@@ -372,7 +372,7 @@ static void validate_outputs(const edge_list& edges, variable_list& grads, const
     }
     grads[i] = at::sum_to(std::move(grads[i]), metadata.shape());
   }
-  if (!is_compatible_type(metadata.type(), grads[i].dispatch_type())) {
+  if (!is_compatible_type(metadata.type(), grads[i].type())) {
     std::stringstream ss;
     ss << "invalid gradient at index " << i << " - expected type ";
     ss << metadata.type() << " but got " << grads[i].type();

torch/csrc/autograd/function.h (+1 -1)

@@ -130,7 +130,7 @@ struct TORCH_API Function : std::enable_shared_from_this<Function> {
   /// Adds the type and shape metadata for a new input. Returns the index of
   /// of the new input.
   uint32_t add_input_metadata(
-    const at::Type& type
+    const at::DeprecatedTypeProperties& type
   , at::IntArrayRef shape
   , at::Device device) noexcept {
     uint32_t input_nr = input_metadata_.size();

torch/csrc/autograd/input_metadata.h (+4 -4)

@@ -12,17 +12,17 @@ namespace torch { namespace autograd {
 struct InputMetadata {
   InputMetadata() = default;
 
-  InputMetadata(const at::Type& type, at::IntArrayRef shape, at::Device device)
+  InputMetadata(const at::DeprecatedTypeProperties& type, at::IntArrayRef shape, at::Device device)
   : type_{&type} , shape_{shape}, device_{device} { }
 
   InputMetadata(const at::Tensor& t)
-  : InputMetadata(t.dispatch_type(), t.sizes(), t.device()) { }
+  : InputMetadata(t.type(), t.sizes(), t.device()) { }
 
   bool is_valid() const {
     return type_ != nullptr;
   }
 
-  const at::Type& type() const {
+  const at::DeprecatedTypeProperties& type() const {
     AT_ASSERT(type_);
     return *type_;
   }
@@ -40,7 +40,7 @@ struct InputMetadata {
   }
 
 private:
-  const at::Type* type_ = nullptr;
+  const at::DeprecatedTypeProperties* type_ = nullptr;
   at::DimVector shape_;
   at::Device device_ = at::kCPU;
 };

torch/csrc/autograd/python_function.cpp (+2 -1)

@@ -46,14 +46,15 @@ namespace torch { namespace autograd {
 VariableInfo::VariableInfo(const Variable& var)
   : type(&var.dispatch_type())
   , device(var.device())
+  , scalar_type(var.scalar_type())
   , size(var.sizes().vec())
   , requires_grad(var.requires_grad()) {
 }
 
 Variable VariableInfo::zeros(at::OptionalDeviceGuard& device_guard) const {
   // NB: This will NOT work if we ever get mixed device gradients
   device_guard.reset_device(device);
-  return at::zeros(size, type->options());
+  return at::zeros(size, type->options(scalar_type));
 }
 
 auto PyFunction::legacy_apply(const variable_list& inputs) -> variable_list {

torch/csrc/autograd/python_function.h (+1)

@@ -25,6 +25,7 @@ struct VariableInfo {
 
   at::Type* type;
   at::Device device = at::kCPU;
+  at::ScalarType scalar_type = at::kFloat;
   std::vector<int64_t> size;
   bool requires_grad;
 };
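
Taken together with the python_function.cpp hunk above, the pattern is: keep the dispatch Type pointer, record the ScalarType separately at construction, and recombine the two when allocating. A minimal sketch (the var variable is hypothetical):

    // Record both pieces, as VariableInfo now does.
    at::Type* type = &var.dispatch_type();
    at::ScalarType scalar_type = var.scalar_type();
    // Later, rebuild TensorOptions by feeding the ScalarType back into the Type.
    at::Tensor grad = at::zeros(var.sizes(), type->options(scalar_type));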

torch/csrc/autograd/python_legacy_variable.cpp (+2 -1)

@@ -46,7 +46,8 @@ static PyObject *THPVariable_pynew(PyTypeObject* type, PyObject *args, PyObject
   if (!data || data == Py_None) {
     // For legacy serialization code, create an empty tensor. This is also used
     // by nn.Parameter() with no arguments.
-    auto var = at::empty({0}, torch::tensors::get_default_tensor_type().options());
+    auto scalar_type = torch::tensors::get_default_scalar_type();
+    auto var = at::empty({0}, torch::tensors::get_default_tensor_type().options(scalar_type));
     tensor = static_cast<Variable&>(var).data();
   } else if (THPVariable_Check(data)) {
     tensor = ((THPVariable*)data)->cdata.data();

torch/csrc/autograd/python_variable_indexing.cpp (+4 -4)

@@ -110,15 +110,15 @@ static Variable sequenceToVariable(const at::Type& type, PyObject* seq) {
   return torch::utils::indexing_tensor_from_data(idx_type, kLong, c10::nullopt, seq);
 }
 
-static Variable valueToTensor(const at::Type & type, PyObject* value) {
+static Variable valueToTensor(const at::Type & type, const ScalarType scalar_type, PyObject* value) {
   if (THPVariable_Check(value)) {
     return reinterpret_cast<THPVariable*>(value)->cdata;
   }
   if (THPUtils_checkLong(value) || PyBool_Check(value)) {
-    return at::scalar_tensor(Scalar(THPUtils_unpackLong(value)), type.options());
+    return at::scalar_tensor(Scalar(THPUtils_unpackLong(value)), type.options(scalar_type));
   }
   if (PyFloat_Check(value)) {
-    return at::scalar_tensor(Scalar(THPUtils_unpackDouble(value)), type.options());
+    return at::scalar_tensor(Scalar(THPUtils_unpackDouble(value)), type.options(scalar_type));
   }
   throw TypeError("can't assign a %s to a %s", Py_TYPE(value)->tp_name, type.toString());
 }
@@ -334,7 +334,7 @@ int THPVariable_setitem(PyObject* self, PyObject* index, PyObject* py_value) {
 
   auto& self_ = reinterpret_cast<THPVariable*>(self)->cdata;
   OptionalDeviceGuard device_guard(device_of(self_));
-  auto value = valueToTensor(self_.dispatch_type(), py_value);
+  auto value = valueToTensor(self_.dispatch_type(), self_.scalar_type(), py_value);
 
   // handle simple types: integers, slices, ellipsis, bool
   if (index == Py_False) { // NOLINT(cppcoreguidelines-pro-type-cstyle-cast)

torch/csrc/autograd/variable.cpp (+1 -1)

@@ -214,7 +214,7 @@ const std::shared_ptr<Function>& Variable::grad_fn() const {
     fn->storage_offset = data().storage_offset();
     fn->set_next_edges(collect_next_edges(diff_view_meta->base_));
     fn->add_input_metadata(
-      diff_view_meta->base_.dispatch_type()
+      diff_view_meta->base_.type()
     , sizes() // Note: sizes(), not base_.sizes(), is intentional
     , diff_view_meta->base_.device());
     diff_view_meta->grad_fn_ = std::move(fn);

torch/csrc/cuda/comm.cpp (+1 -1)

@@ -59,7 +59,7 @@ std::vector<Tensor> broadcast(const Tensor& tensor, IntArrayRef devices) {
     tensors.push_back(tensor);
     for (auto device : devices.slice(1)) {
       _device_guard.set_index(device);
-      tensors.push_back(at::empty(tensor.sizes(), type.options()));
+      tensors.push_back(at::empty(tensor.sizes(), type.options(tensor.scalar_type())));
     }
     nccl::broadcast(tensors);
   } else {

torch/csrc/jit/passes/shape_analysis.cpp (+2 -3)

@@ -157,10 +157,9 @@ class ShapePropagator {
       return *iv;
     }
     if (CompleteTensorTypePtr type = type_->cast<CompleteTensorType>()) {
-      auto backend =
-          type->device().is_cpu() ? at::Backend::CPU : at::Backend::CUDA;
+      auto attype = type->device().is_cpu() ?
+        at::CPU(type->scalarType()) : at::CUDA(type->scalarType());
       at::DeviceGuard device_guard(type->device());
-      auto& attype = at::getNonVariableType(backend, type->scalarType());
       auto t =
           at::empty_strided(type->sizes(), type->strides(), attype.options())
               .zero_();
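
A hedged note on why attype.options() takes no argument here: at::CPU(s) and at::CUDA(s) return a DeprecatedTypeProperties that already binds the scalar type, so its options() needs no extra ScalarType, unlike Type::options() above. Sketch only (shapes made up):

    at::DeprecatedTypeProperties& attype = at::CPU(at::kFloat);
    at::Tensor t = at::empty_strided({2, 3}, {3, 1}, attype.options()).zero_();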
