// Copyright (c) Facebook, Inc. and its affiliates. // All rights reserved. // // This source code is licensed under the BSD-style license found in the // LICENSE file in the root directory of this source tree. #include #include namespace at::functorch { template struct NewBlahBatchRuleHelperSymInt; template struct NewBlahBatchRuleHelperSymInt> { static std::tuple> apply( const Tensor& tensor, std::optional batch_dim, SymIntArrayRef shape, T... extra_args) { const auto bdim_size = tensor.sym_size(batch_dim.value()); c10::SmallVector new_shape; new_shape.reserve(shape.size() + 1); new_shape.emplace_back(bdim_size); new_shape.insert(new_shape.end(), shape.begin(), shape.end()); return std::make_tuple(Func(tensor, new_shape, std::forward(extra_args)...), 0); } }; template struct NewBlahBatchRuleHelper; template struct NewBlahBatchRuleHelper> { static std::tuple> apply( const Tensor& tensor, std::optional batch_dim, IntArrayRef shape, T... extra_args) { const auto bdim_size = tensor.size(batch_dim.value()); VmapDimVector new_shape; new_shape.reserve(shape.size() + 1); new_shape.emplace_back(bdim_size); new_shape.insert(new_shape.end(), shape.begin(), shape.end()); return std::make_tuple(Func(tensor, new_shape, std::forward(extra_args)...), 0); } }; // USAGE: NEW_BLAH_BATCH_RULE(at::new_zeros) // INCORRECT USAGE: NEW_BLAH_BATCH_RULE(&at::new_zeros) // It is important that this macro is not passed a function pointer!! #define NEW_BLAH_BATCH_RULE(fn) SINGLE_ARG(\ NewBlahBatchRuleHelper<\ decltype(&fn),\ &fn,\ c10::guts::function_traits::parameter_types>::apply) #define NEW_BLAH_BATCH_RULE_SYMINT(fn) SINGLE_ARG(\ NewBlahBatchRuleHelperSymInt<\ decltype(&fn),\ &fn,\ c10::guts::function_traits::parameter_types>::apply) static std::tuple> _new_zeros_with_same_feature_meta_batch_rule( const Tensor& self, std::optional self_bdim, const Tensor& other, std::optional other_bdim, int64_t self_num_batch_dims) { // The "self, other" naming is too confusing // What this function really says is "create a new tangent for this base". const auto& base = other; const auto& base_bdim = other_bdim; const auto& tangent = self; const auto& tangent_bdim = self_bdim; // Three case: // Case 1 Case 2 Case 3 // base [6] [B, 6] [B, 6] // tangent [B, 5] [5] [B, 5] // result [B, 6] [B, 6] [B, 6] // Case 2 & 3 if (base_bdim) { auto base_ = moveBatchDimToFront(base, base_bdim); Tensor tangent_ = tangent; if (tangent_bdim.has_value()) { // tangent [B, K0, K1, 5] // base_ [B, 6] // We want to move B to after the Ks, so that self_num_batch_dims // (which really means tangent_num_batch_dims) isn't interfered with. // [B, K0, K1, 6] -> [K0, K1, B, 6] // // [K0, K1, B, 6], [B, 5], 2 -> [K0, K1, B, 5] tangent_ = tangent.movedim(*tangent_bdim, self_num_batch_dims); } const auto result = at::_new_zeros_with_same_feature_meta(tangent_, base_, self_num_batch_dims); return std::make_tuple(result, self_num_batch_dims); } // Case 1: auto tangent_ = moveBatchDimToFront(tangent, tangent_bdim); auto result = at::_new_zeros_with_same_feature_meta(tangent_, base, self_num_batch_dims + 1); return std::make_tuple(result, 0); } static std::tuple> linspace_logspace_batch_rule_helper( const at::Tensor& start, std::optional start_bdim, const at::Tensor& end, std::optional end_bdim, int64_t steps, std::optional base, std::optional dtype, std::optional layout, std::optional device, std::optional pin_memory) { auto batch_size = get_bdim_size2(start, start_bdim, end, end_bdim); auto start_ = ensure_has_bdim(start, start_bdim.has_value(), batch_size); auto end_ = ensure_has_bdim(end, end_bdim.has_value(), batch_size); start_ = moveBatchDimToFront(start_, start_bdim); end_ = moveBatchDimToFront(end_, end_bdim); auto tensor_options = at::TensorOptions().dtype(dtype).layout(layout).device(device).pinned_memory(pin_memory); Tensor result; if (steps == 0){ result = at::full({batch_size, 0}, 0, tensor_options); } else if (steps == 1){ result = start_.new_empty({batch_size}, tensor_options).copy_(start_).unsqueeze(1); } else { result = (start_ + at::arange(0, steps, tensor_options).unsqueeze_(1) * (end_ - start_) / (steps - 1)).transpose(0, 1); } if (base){ result = at::pow(*base, result); } if (dtype && result.scalar_type() != *dtype){ result = result.to(*dtype); } return std::make_tuple(result, 0); } static std::tuple> linspace_Tensor_Tensor_batch_rule( const at::Tensor& start, std::optional start_bdim, const at::Tensor& end, std::optional end_bdim, int64_t steps, std::optional dtype, std::optional layout, std::optional device, std::optional pin_memory){ return linspace_logspace_batch_rule_helper(start, start_bdim, end, end_bdim, steps, std::nullopt, dtype, layout, device, pin_memory); } static std::tuple> linspace_Tensor_Scalar_batch_rule( const at::Tensor& start, std::optional start_bdim, const at::Scalar& end, int64_t steps, std::optional dtype, std::optional layout, std::optional device, std::optional pin_memory){ auto end_t = at::native::wrapped_scalar_tensor(end, start.device()); return linspace_logspace_batch_rule_helper(start, start_bdim, end_t, std::nullopt, steps, std::nullopt, dtype, layout, device, pin_memory); } static std::tuple> linspace_Scalar_Tensor_batch_rule( const at::Scalar& start, const at::Tensor& end, std::optional end_bdim, int64_t steps, std::optional dtype, std::optional layout, std::optional device, std::optional pin_memory){ auto start_t = at::native::wrapped_scalar_tensor(start, end.device()); return linspace_logspace_batch_rule_helper(start_t, std::nullopt, end, end_bdim, steps, std::nullopt, dtype, layout, device, pin_memory); } static std::tuple> logspace_Tensor_Tensor_batch_rule( const at::Tensor& start, std::optional start_bdim, const at::Tensor& end, std::optional end_bdim, int64_t steps, double base, std::optional dtype, std::optional layout, std::optional device, std::optional pin_memory){ return linspace_logspace_batch_rule_helper(start, start_bdim, end, end_bdim, steps, std::make_optional(base), dtype, layout, device, pin_memory); } static std::tuple> logspace_Tensor_Scalar_batch_rule( const at::Tensor& start, std::optional start_bdim, const at::Scalar& end, int64_t steps, double base, std::optional dtype, std::optional layout, std::optional device, std::optional pin_memory){ auto end_t = at::native::wrapped_scalar_tensor(end, start.device()); return linspace_logspace_batch_rule_helper(start, start_bdim, end_t, std::nullopt, steps, std::make_optional(base), dtype, layout, device, pin_memory); } static std::tuple> logspace_Scalar_Tensor_batch_rule( const at::Scalar& start, const at::Tensor& end, std::optional end_bdim, int64_t steps, double base, std::optional dtype, std::optional layout, std::optional device, std::optional pin_memory){ auto start_t = at::native::wrapped_scalar_tensor(start, end.device()); return linspace_logspace_batch_rule_helper(start_t, std::nullopt, end, end_bdim, steps, std::make_optional(base), dtype, layout, device, pin_memory); } static bool _has_same_storage_numel_batch_rule(const Tensor& a, const Tensor& b) { return true; } TORCH_LIBRARY_IMPL(aten, FuncTorchBatched, m) { m.impl("_has_same_storage_numel", _has_same_storage_numel_batch_rule); VMAP_SUPPORT(ones_like, BASIC_UNARY_BATCH_RULE(ATEN_FN(ones_like))); VMAP_SUPPORT(zeros_like, BASIC_UNARY_BATCH_RULE(ATEN_FN(zeros_like))); VMAP_SUPPORT(empty_like, BASIC_UNARY_BATCH_RULE(ATEN_FN(empty_like))); VMAP_SUPPORT(randn_like, BASIC_UNARY_BATCH_RULE(ATEN_FN(randn_like))); VMAP_SUPPORT(rand_like, BASIC_UNARY_BATCH_RULE(ATEN_FN(rand_like))); VMAP_SUPPORT(full_like, BASIC_UNARY_BATCH_RULE(ATEN_FN(full_like))); VMAP_SUPPORT(new_empty, NEW_BLAH_BATCH_RULE_SYMINT(ATEN_FN(new_empty))); VMAP_SUPPORT(new_zeros, NEW_BLAH_BATCH_RULE_SYMINT(ATEN_FN(new_zeros))); VMAP_SUPPORT(new_ones, NEW_BLAH_BATCH_RULE_SYMINT(ATEN_FN(new_ones))); VMAP_SUPPORT(new_full, NEW_BLAH_BATCH_RULE_SYMINT(ATEN_FN(new_full))); VMAP_SUPPORT2(linspace, Tensor_Tensor, linspace_Tensor_Tensor_batch_rule); VMAP_SUPPORT2(linspace, Tensor_Scalar, linspace_Tensor_Scalar_batch_rule); VMAP_SUPPORT2(linspace, Scalar_Tensor, linspace_Scalar_Tensor_batch_rule); VMAP_SUPPORT2(logspace, Tensor_Tensor, logspace_Tensor_Tensor_batch_rule); VMAP_SUPPORT2(logspace, Tensor_Scalar, logspace_Tensor_Scalar_batch_rule); VMAP_SUPPORT2(logspace, Scalar_Tensor, logspace_Scalar_Tensor_batch_rule); VMAP_SUPPORT(_new_zeros_with_same_feature_meta, _new_zeros_with_same_feature_meta_batch_rule); // Not sure how to add the ones with irregular args to the mix cleanly (i.e. randint takes an extra int parameter) } } // namespace at::functorch