#include #include #include #include namespace c10 { namespace impl { namespace { #ifndef STRIP_ERROR_MESSAGES std::string toString(std::optional k) { if (k.has_value()) { return toString(*k); } else { return "(catch all)"; } } #endif } OperatorEntry::OperatorEntry(OperatorName&& operator_name) : name_(std::move(operator_name)) , schema_() #ifndef C10_MOBILE , tags_() #endif , dispatchTable_() , dispatchKeyExtractor_(DispatchKeyExtractor::makeUninitialized()) , kernels_() , cpp_signature_() , sym_cpp_signature_() , is_observed_(ObservedOperators::isObserved(name_)) { // Pick up any backend fallbacks that were registered prior to this // OperatorEntry being created updateDispatchTableFull_(c10::Dispatcher::singleton()); } namespace { void checkSchema(const OperatorName& name, const FunctionSchema& from_def_, const std::string& from_def_debug, const KernelFunction& kernel, const FunctionSchema& inferred_, const std::string& inferred_debug) { // TODO: figure out if we can just directly save real schema at def time FunctionSchema from_def = from_def_.cloneWithRealTypes(kernel.isValidSymUnboxed()); FunctionSchema inferred = inferred_.cloneWithRealTypes(); std::optional schema_difference = findSchemaDifferences(from_def, inferred); if (schema_difference.has_value()) { TORCH_CHECK(false, "Inferred operator schema for a C++ kernel function doesn't match the expected function schema.\n" " operator: ", toString(name), "\n", " expected schema: ", toString(from_def), "\n", " ", from_def_debug, "\n", " inferred schema: ", toString(inferred), "\n", " ", inferred_debug, "\n", " reason: ", *schema_difference); } } } // anonymous namespace const AnnotatedKernel& OperatorEntry::missingKernel() const { static AnnotatedKernel kernel; return kernel; } const AnnotatedKernel& OperatorEntry::ambiguousAutogradOtherKernel() const { static AnnotatedKernel kernel( c10::KernelFunction::makeAmbiguousAutogradOther(), nullptr, "ambiguous_autogradother"); return kernel; } void OperatorEntry::assertSignatureIsCorrect(const CppSignature& call_signature, bool has_symint) const { if (has_symint) { if (C10_UNLIKELY(sym_cpp_signature_.has_value() && (call_signature != sym_cpp_signature_->signature))) { reportSignatureError(call_signature, *sym_cpp_signature_); } } else { if (C10_UNLIKELY(cpp_signature_.has_value() && (call_signature != cpp_signature_->signature))) { reportSignatureError(call_signature, *cpp_signature_); } } } void OperatorEntry::registerSchema(FunctionSchema&& schema, std::string&& debug, std::vector tags) { TORCH_INTERNAL_ASSERT(!schema_.has_value()); for (const auto& kernel : kernels_) { for (const auto &j : kernel.second) { if (j.inferred_function_schema != nullptr) { checkSchema(name_, schema, debug, j.kernel, *j.inferred_function_schema, j.debug); } } } // NB: don't register schema until after we've checked everything! dispatchKeyExtractor_.registerSchema(schema); schema_ = AnnotatedSchema(std::move(schema), std::move(debug)); #ifndef C10_MOBILE tags_ = std::move(tags); #endif } void OperatorEntry::deregisterSchema() { TORCH_INTERNAL_ASSERT(schema_.has_value()); schema_ = std::nullopt; dispatchKeyExtractor_.deregisterSchema(); } OperatorEntry::AnnotatedKernelContainerIterator OperatorEntry::registerKernel( const c10::Dispatcher& dispatcher, std::optional dispatch_key, KernelFunction kernel, std::optional cpp_signature, std::unique_ptr inferred_function_schema, std::string debug ) { // NB: cpp_signature doesn't get cleared even after the kernel that populated // it is deleted. This means you could poison the value of cpp_signature_ // with a bad signature value, and then it would permanently stay there until // you deregister the schema. This can't really be fixed, because we // only do a typed() test once in the lifetime of a TypedOperatorHandle, // which means if you could validly change the type of a cpp_signature, then // that would also invalidate the old TypedOperatorHandles. if (cpp_signature.has_value()) { auto& local_cpp_signature = kernel.isValidSymUnboxed() ? sym_cpp_signature_ : cpp_signature_; if (local_cpp_signature.has_value()) { TORCH_CHECK(*cpp_signature == local_cpp_signature->signature, "\nMismatch in kernel C++ signatures\n", " operator: ", (this->schema_.has_value() ? toString(this->schema_->schema) : toString(name_)), "\n", " ", (this->schema_.has_value() ? this->schema_->debug : "no debug info"), "\n", " kernel 1: ", local_cpp_signature->signature.name(), "\n", " dispatch key: ", toString(local_cpp_signature->dispatch_key), "\n", " ", local_cpp_signature->debug, "\n", " kernel 2: ", cpp_signature->name(), "\n", " dispatch key: ", toString(dispatch_key), "\n", " ", debug, "\n" ); } else { local_cpp_signature = CppSignatureWithDebug { *cpp_signature, debug, dispatch_key }; } } if (schema_ && inferred_function_schema) { checkSchema(name_, schema_->schema, schema_->debug, kernel, *inferred_function_schema, debug); } // Add the kernel to the kernels list, // possibly creating the list if this is the first kernel. // Redirect catchAll registrations to CompositeImplicitAutograd. auto& k = dispatch_key.has_value() ? kernels_[*dispatch_key] : kernels_[DispatchKey::CompositeImplicitAutograd]; #ifdef C10_DISPATCHER_ONE_KERNEL_PER_DISPATCH_KEY if (k[0].kernel.isValid()) { #else if (!k.empty()) { #endif // Suppress the warning for Meta key as we are overriding C++ meta functions with python meta functions // for some ops if (dispatch_key != DispatchKey::Meta) { TORCH_WARN_ONCE("Warning only once for all operators, other operators may also be overridden.\n", " Overriding a previously registered kernel for the same operator and the same dispatch key\n", " operator: ", (schema_.has_value() ? toString(schema_->schema) : toString(name_)), "\n", " ", (this->schema_.has_value() ? this->schema_->debug : "no debug info"), "\n", " dispatch key: ", toString(dispatch_key), "\n", " previous kernel: ", (cpp_signature_.has_value() ? cpp_signature_->debug : (sym_cpp_signature_.has_value() ? sym_cpp_signature_->debug : "no debug info")), "\n", " new kernel: ", debug ); } } #ifdef C10_DISPATCHER_ONE_KERNEL_PER_DISPATCH_KEY k[0].kernel = std::move(kernel); k[0].inferred_function_schema = std::move(inferred_function_schema); k[0].debug = std::move(debug); #else k.emplace_front(std::move(kernel), std::move(inferred_function_schema), std::move(debug)); #endif AnnotatedKernelContainerIterator inserted = k.begin(); // update the dispatch table, i.e. re-establish the invariant // that the dispatch table points to the newest kernel if (dispatch_key.has_value()) { updateDispatchTable_(dispatcher, *dispatch_key); } else { updateDispatchTableFull_(dispatcher); } return inserted; } void OperatorEntry::deregisterKernel_( const c10::Dispatcher& dispatcher, std::optional dispatch_key, AnnotatedKernelContainerIterator kernel ) { // Redirect catchAll deregistrations to CompositeImplicitAutograd. DispatchKey dk = dispatch_key.has_value() ? *dispatch_key : DispatchKey::CompositeImplicitAutograd; auto found = kernels_.find(dk); TORCH_INTERNAL_ASSERT(found != kernels_.end(), "Tried to deregister a kernel for dispatch key ", toString(dispatch_key), " but there are no kernels registered for this dispatch key. The operator is ", toString(name_)); auto& k = found->second; #ifdef C10_DISPATCHER_ONE_KERNEL_PER_DISPATCH_KEY // We are about to remove the array from the map, no need to do anything. #else k.erase(kernel); #endif if (k.empty()) { // the invariant says we don't want empty lists but instead remove the list from the map kernels_.erase(found); } updateDispatchTable_(dispatcher, dk); } void OperatorEntry::updateFallback(const c10::Dispatcher& dispatcher, DispatchKey dispatch_key) { updateDispatchTable_(dispatcher, dispatch_key); } const KernelFunction& OperatorEntry::computeDispatchTableEntry(const c10::Dispatcher& dispatcher, DispatchKey dispatch_key) const { return computeDispatchTableEntryWithDebug(dispatcher, dispatch_key).first.kernel; } bool OperatorEntry::hasKernelForAnyDispatchKey(DispatchKeySet ks) const { TORCH_INTERNAL_ASSERT(kernels_.find(DispatchKey::Undefined) == kernels_.end()); for (auto& kv : kernels_) { // Note [No Alias Keys in DispatchKeySet] if (!isAliasDispatchKey(kv.first) && ks.has(kv.first)) return true; } return false; } bool OperatorEntry::hasKernelForDispatchKey(DispatchKey k) const { TORCH_INTERNAL_ASSERT(kernels_.find(DispatchKey::Undefined) == kernels_.end()); auto it = kernels_.find(k); if (it == kernels_.end()) return false; return !it->second.empty(); } const KernelFunction& OperatorEntry::kernelForDispatchKey(DispatchKey k) const { auto it = kernels_.find(k); TORCH_CHECK(it != kernels_.end() && !it->second.empty(), "no kernel for ", k, " on ", name_); auto jt = it->second.begin(); TORCH_INTERNAL_ASSERT(jt->kernel.isValid()) return jt->kernel; } bool OperatorEntry::hasComputedKernelForDispatchKey(DispatchKey k) const { TORCH_CHECK(!isAliasDispatchKey(k), "Alias keys do not have runtime kernel registrations."); const auto dispatch_ix = getDispatchTableIndexForDispatchKey(k); TORCH_INTERNAL_ASSERT(dispatch_ix >= 0 && dispatch_ix < c10::num_runtime_entries, toString(k), dispatch_ix); return dispatchTable_[dispatch_ix].isValid(); } const AnnotatedKernel* OperatorEntry::getKernelForDispatchKey(DispatchKey dispatch_key) const{ auto kern_it = kernels_.find(dispatch_key); if (kern_it != kernels_.end()) { TORCH_INTERNAL_ASSERT(!kern_it->second.empty()); TORCH_INTERNAL_ASSERT(kern_it->second.front().kernel.isValid()); return &kern_it->second.front(); } return nullptr; } const std::vector& OperatorEntry::getTags() const { #if defined C10_MOBILE TORCH_CHECK(false, "tags are not saved for Mobile"); #else return tags_; #endif } std::pair OperatorEntry::computeDispatchTableEntryWithDebug(const c10::Dispatcher& dispatcher, DispatchKey dispatch_key) const { // [Note] DispatchTable computation // dispatchTable contains entries for runtime dispatch keys. // For any dispatch key, it'll pick a kernel using the following order: // (1) Use kernel if it's directly registered to this key // (2) Handle runtime keys that have kernels available from alias keys // (2.1) Use kernel from DispatchKey::CompositeExplicitAutogradNonFunctional if available. // This is used to register a kernel that works for all backends in inference, except "functional" backends // like LazyTensor/XLA. But it requires separate registration for Autograd keys to support training. // (2.2) Use kernel from DispatchKey::CompositeExplicitAutograd if available. // This is used to register a kernel that works for all backend in inference. But it requires // separate registration for Autograd keys to support training. // (2.3) Use kernel from DispatchKey::CompositeImplicitAutograd if available. // For autograd keys, we only use kernel from CompositeImplicitAutograd when there's no direct registration // to its corresponding backend key or CompositeExplicitAutograd. See Note [CompositeExplicitAutograd and CompositeImplicitAutograd]. // For AutogradOther, we eagerly return ambiguousAutogradOtherKernel() if there's registration to any of // its backends and ask backend extender to request a decicated Autograd key for the backend. // See Note [Ambiguity in AutogradOther kernel] for more details. // A CompositeExplicitAutograd kernel prevents CompositeImplicitAutograd kernel being used for Autograd keys, but it doesn't // cause confusion for AutogradOther. It's pretty straightforward to use Autograd (if available) // in this case. // (2.4) Use kernel from DispatchKey::Autograd if available // (2.5) Use kernel from DispatchKey::FuncTorchBatchedDecomposition if available // The implementation of (2.2) relies on the invariant that for a given backend, // `computeDispatchTableEntryWithDebug()` will be called for that backend's autograd key after the // backend key. See Note [Refresh Runtime Autograd entries in dispatchTable_] // (3) Use fallthrough kernel that are registered as fallback. // Alias Key Precedence: // CompositExplicitAutogradNonFunctional > CompositeExplicitAutograd > CompositeImplicitAutograd > Autograd // Note [CompositeExplicitAutograd and CompositeImplicitAutograd] // When there're registrations to both CompositeExplicitAutograd & CompositeImplicitAutograd & Autograd, from (2.2) we know CompositeExplicitAutograd // and Autograd kernels will be picked up and CompositeImplicitAutograd is overriden. // This is fine and in practice CompositeExplicitAutograd and CompositeImplicitAutograd shouldn't co-exist for an op. // TODO: Update alias key precedence after we add new alias keys AutogradDispatchCPUOrCUDA . // 1. Operator registration if (auto direct_registration = getKernelForDispatchKey(dispatch_key)) { return {*direct_registration, "kernel"}; } // 2.1 Use CompositeExplicitAutogradNonFunctional kernel if available. // See Note [Undefined in dispatchTable_] for the special handling for Undefined. if (dispatch_key == DispatchKey::Undefined || isIncludedInAlias(dispatch_key, DispatchKey::CompositeExplicitAutogradNonFunctional)) { if (auto default_backend_registration = getKernelForDispatchKey(DispatchKey::CompositeExplicitAutogradNonFunctional)) { return {*default_backend_registration, "default backend kernel"}; } } // 2.2 Use CompositeExplicitAutograd kernel if available. // See Note [Undefined in dispatchTable_] for the special handling for Undefined. if (dispatch_key == DispatchKey::Undefined || isIncludedInAlias(dispatch_key, DispatchKey::CompositeExplicitAutograd)) { if (auto default_backend_registration = getKernelForDispatchKey(DispatchKey::CompositeExplicitAutograd)) { return {*default_backend_registration, "default backend kernel"}; } } // Note when there's direct registration to CompositeExplicitAutograd, this code path will only be hit by // non backend keys (e.g AutogradXXX, Batched etc) due to (2.1). bool has_backend_kernel = hasKernelForAnyDispatchKey(getBackendKeySetFromAutograd(dispatch_key)) || // See Note [No Alias Keys in DispatchKeySet] hasKernelForDispatchKey(DispatchKey::CompositeExplicitAutograd); // 2.3. Use CompositeImplicitAutograd kernel if available. For autograd keys, we only use kernel from CompositeImplicitAutograd // when there's no direct registration to its corresponding backend key or CompositeExplicitAutograd. // For AutogradOther, we return ambiguousAutogradOtherKernel() if there's registration // to any of its backends. // See Note [Undefined in dispatchTable_] for the special handling for Undefined. // If the dispatch key is included in CompositeImplicitAutogradNestedTensor, // then we register it to nested-tensor kernel rather than // regular-tensor CompositeImplicitAutograd kernel. // We have no intention to change the behavior of Undefined, // so this nested-tensor branch requires `dispatch_key != DispatchKey::Undefined` // to let the original CompositeImplicitAutograd handle Undefined // See Note: [Disjoint AliasKeyset] The order for this alias key doesn't matter if (dispatch_key != DispatchKey::Undefined && isIncludedInAlias(dispatch_key, DispatchKey::CompositeImplicitAutogradNestedTensor)) { if (auto nested_registration = getKernelForDispatchKey(DispatchKey::CompositeImplicitAutogradNestedTensor)) { return {*nested_registration, "nested kernel"}; } } if (dispatch_key == DispatchKey::Undefined || isIncludedInAlias(dispatch_key, DispatchKey::CompositeImplicitAutograd)) { if (auto math_registration = getKernelForDispatchKey(DispatchKey::CompositeImplicitAutograd)) { if (dispatch_key == DispatchKey::AutogradOther && hasKernelForAnyDispatchKey(c10::autogradother_backends)) { return {ambiguousAutogradOtherKernel(), "ambiguous autogradother"}; } else if (!has_backend_kernel) { return {*math_registration, "math kernel"}; } } } // 2.4. For autograd backend keys, use kernel from DispatchKey::Autograd if available if (isIncludedInAlias(dispatch_key, DispatchKey::Autograd)) { if (auto autograd_registration = getKernelForDispatchKey(DispatchKey::Autograd)) { return {*autograd_registration, "autograd kernel"}; } } // 2.5. For batched backend keys, use kernel from DispatchKey::FuncTorchBatchedDecomposition if available // See Note: [Disjoint AliasKeyset] The order for this alias key doesn't matter if (isIncludedInAlias(dispatch_key, DispatchKey::FuncTorchBatchedDecomposition)) { if (auto batched_registration = getKernelForDispatchKey(DispatchKey::FuncTorchBatchedDecomposition)) { return {*batched_registration, "batched kernel"}; } } // 3. Backend fallback auto dispatch_ix = getDispatchTableIndexForDispatchKey(dispatch_key); if (dispatch_ix < 0) { return {missingKernel(), "backend fallback not registered on mobile"}; } if (dispatcher.backendFallbackKernels_[dispatch_ix].kernel.isValid()) { return {dispatcher.backendFallbackKernels_[dispatch_ix], "backend fallback"}; } // 4. Default to error return {missingKernel(), "missing"}; } // synchronizes the dispatch table entry for a given dispatch key // with the current state of kernel registrations in the dispatcher. // note that this is not a complete update, due to relationships between // dispatch keys (e.g. runtime keys and their associated autograd keys, // or alias keys and their associated keysets). // This function should be considered a private helper for updateDispatchTable_() void OperatorEntry::updateDispatchTableEntry_(const c10::Dispatcher& dispatcher, DispatchKey dispatch_key) { const auto dispatch_ix = getDispatchTableIndexForDispatchKey(dispatch_key); if (C10_UNLIKELY(dispatch_ix == -1)) { return; } dispatchTable_[dispatch_ix] = computeDispatchTableEntry(dispatcher, dispatch_key); dispatchKeyExtractor_.setOperatorHasFallthroughForKey(dispatch_key, dispatchTable_[dispatch_ix].isFallthrough()); } // synchronizes the dispatch table entries for a given dispatch key *and its // associated keys* with the current state of kernel registrations in the // dispatcher. // After a kernel has been registered to a dispatch key, a call to this // function will synchronize the dispatcher state. See e.g. registerKernel() void OperatorEntry::updateDispatchTable_(const c10::Dispatcher& dispatcher, DispatchKey dispatch_key) { // Handle Undefined separately since it isn't a runtime key but we have an entry in dispatchTable_. // See Note [Undefined in dispatchTable_] if (dispatch_key == DispatchKey::Undefined) { updateDispatchTableEntry_(dispatcher, dispatch_key); return; } for (auto k : c10::getRuntimeDispatchKeySet(dispatch_key)) { updateDispatchTableEntry_(dispatcher, k); } // Registration to CompositeExplicitAutogradNonFunctional, CompositeExplicitAutograd and CompositeImplicitAutograd should be populated to Undefined. // We cannot do this above since Undefined cannot be represented in DispatchKeySet. if (dispatch_key == DispatchKey::CompositeImplicitAutograd || dispatch_key == DispatchKey::CompositeExplicitAutograd || dispatch_key == DispatchKey::CompositeExplicitAutogradNonFunctional) { updateDispatchTableEntry_(dispatcher, DispatchKey::Undefined); } // Note [Refresh Runtime Autograd entries in dispatchTable_] // Registering to backend key might affect computed entry at its Autograd backend key due to (2.1) & (2.3). // In theory, we should only have to check if the given runtime key has "dense" functionality, // e.g. DispatchKey::CPU (which is composed of DispatchKey::Dense and BackendComponent::CPUBit). // However, there are some backends that should be included in this set that don't have the dense key set. // E.g. DispatchKey::Meta, DispatchKey::MAIA. if (c10::isBackendDispatchKey(dispatch_key)) { DispatchKey autograd_key = getAutogradKeyFromBackend(toBackendComponent(dispatch_key)); updateDispatchTableEntry_(dispatcher, autograd_key); } } // does a complete update of the dispatch table, synchronizing all // runtime dispatch keys with the current state of kernel registrations // in the dispatcher. // Note that we use updateDispatchTable_() to perform our per-key updating, // even though that function is equipped to handle out-of-order updates and // alias key updates, neither of which we send it. This is deliberate - the // current design is more tractable with all updates funneled through a single // per-key update mechanism, than with multiple variations that assume different // invariants. // void OperatorEntry::updateDispatchTableFull_(const c10::Dispatcher& dispatcher) { // Note [Undefined in dispatchTable_] // DispatchKey Undefined is used in runtime: // (1) it gives people place to specify functionality that should run when there are no dispatch keys, // e.g., an op without Tensor inputs or empty TensorList arguments // (2) it would let us remove the explicit error checking code in the dispatch hotpath, and so when // no dispatch keys are available we just slide into the undefined handler which would then raise // the error message. // In the old world of catchAll, the only way to "register" a kernel to Undefined is by registering it to // catchAll. After catchAllKernel_ is removed, Undefined now can get a kernel from either CompositeExplicitAutograd, // or CompositeImplicitAutograd alias key so that we don't break the support. Ideally isIncludedInAlias(Undefined, CompositeImplicitAutograd) // should return true, it returns false because Undefined cannot be represented in a DispatchKeySet. updateDispatchTable_(dispatcher, DispatchKey::Undefined); for (auto k : DispatchKeySet(DispatchKeySet::FULL)) { updateDispatchTable_(dispatcher, k); } } void OperatorEntry::checkInvariants() const { if (schema_) { TORCH_INTERNAL_ASSERT(schema_->schema.operator_name() == name_, dumpState()); dispatchKeyExtractor().checkInvariants(schema_->schema); } TORCH_INTERNAL_ASSERT(kernels_.find(DispatchKey::Undefined) == kernels_.end(), dumpState()); for (const auto& kv : kernels_) { TORCH_INTERNAL_ASSERT(!kv.second.empty(), dumpState()); } for (auto k : DispatchKeySet(DispatchKeySet::FULL)) { auto expected_k = computeDispatchTableEntry(c10::Dispatcher::singleton(), k); auto idx = getDispatchTableIndexForDispatchKey(k); if (C10_UNLIKELY(idx == -1)) { continue; } TORCH_INTERNAL_ASSERT(expected_k._equalsBoxedAndUnboxed(dispatchTable_[idx]), "Canonical state\n~~~~~~~~~~~\n", dumpState(), "\n\n" "Computed table:\n~~~~~~~~~~~\n", dumpComputedTable()); } } std::string OperatorEntry::listAllDispatchKeys() const { std::ostringstream str; str << "["; bool has_kernels = false; for (auto k : DispatchKeySet(DispatchKeySet::FULL)) { auto iter = getDispatchTableIndexForDispatchKey(k); if (iter == -1 || !dispatchTable_[iter].isValid()) { continue; } if (has_kernels) { str << ", "; } str << k; has_kernels = true; } str << "]"; return str.str(); } void OperatorEntry::reportSignatureError(const CppSignature& call_signature, const CppSignatureWithDebug& saved_signature) const { TORCH_CHECK(false, "\nTried to access or call an operator with a wrong signature.\n", " operator: ", (schema_.has_value() ? toString(schema_->schema) : toString(name_)), "\n", " ", (schema_.has_value() ? schema_->debug : "unknown debug info"), "\n", " correct signature: ", saved_signature.signature.name(), "\n", " ", saved_signature.debug, "\n", " accessed/called as: ", call_signature.name(), "\n", "This likely happened in a call to OperatorHandle::typed(). ", "Please make sure that the function signature matches the signature in the operator registration call." ); }; #ifndef STRIP_ERROR_MESSAGES static std::string post_process_dispatch_key_str(std::string dispatch_key) { const std::string substr = "PrivateUse1"; if (substr.size() <= dispatch_key.size() && std::equal(substr.rbegin(), substr.rend(), dispatch_key.rbegin())) { auto privateuse1_backend = get_privateuse1_backend(); if (privateuse1_backend != "privateuseone") { // remove trailing "*PrivateUse1" dispatch_key.erase(dispatch_key.length() - substr.length()); // append the registered backend's name. // AutogradPrivateUse1 -> AutogradFoo auto backend_name = c10::get_privateuse1_backend(); dispatch_key = dispatch_key + backend_name; } } return dispatch_key; } #endif void OperatorEntry::reportError(DispatchKey dispatchKey) const { // If there is an invariant problem, report it now. checkInvariants(); if (report_error_callback_ != nullptr) { report_error_callback_->pyinterpreter()->reportErrorCallback(report_error_callback_->ptr(&report_error_callback_->pyinterpreter()), dispatchKey); // reportErrorCallback should have raised an error TORCH_INTERNAL_ASSERT(false); } if (dispatchKey == DispatchKey::Undefined) { TORCH_CHECK_NOT_IMPLEMENTED(false, "There were no tensor arguments to this function (e.g., you passed an " "empty list of Tensors), but no fallback function is registered for schema ", name_, ". This usually means that this function requires a non-empty list of Tensors, " "or that you (the operator writer) forgot to register a fallback function. " "Available functions are ", listAllDispatchKeys(), ".\n\n", dumpComputedTable()) } TORCH_CHECK_NOT_IMPLEMENTED(false, "Could not run '", name_, "' with arguments", " from the '", post_process_dispatch_key_str(toString(dispatchKey)), "' backend. This could be because " "the operator doesn't exist for this backend, or was omitted during ", "the selective/custom build process (if using custom build). If you are a ", "Facebook employee using PyTorch on mobile, please visit ", "https://fburl.com/ptmfixes for possible resolutions. '", name_, "' is only available for these backends: ", listAllDispatchKeys(), ".\n\n", dumpComputedTable()); } // INSPECTING DISPATCHER STATE // ~~~~~~~~~~~~~~~~~~~~~~~~~~~ // The dumper functions purposely do not check invariants, as you might be using // them to debug situations where the invariants are violated. // Inspect what the computed dispatch table would be (e.g., what // updateDispatchTableFull_ would update the dispatch table to be) std::string OperatorEntry::dumpComputedTable() const { std::ostringstream oss; // Need to handle Undefined separately, because its a runtime key that can't be represented // in a DispatchKeySet. std::vector runtime_keys = {DispatchKey::Undefined}; for (auto k : DispatchKeySet(DispatchKeySet::FULL)) runtime_keys.push_back(k); for (auto k : runtime_keys) { auto kernel_prov = computeDispatchTableEntryWithDebug(c10::Dispatcher::singleton(), k); if (kernel_prov.first.kernel.isValid()) { oss << toString(k) << ": " << (kernel_prov.first.kernel.isFallthrough() ? "fallthrough " : "") << kernel_prov.first.debug << " [" << kernel_prov.second << "]\n"; } } return oss.str(); } void OperatorEntry::setReportErrorCallback_(std::unique_ptr callback) { report_error_callback_ = std::move(callback); } // Inspect the "canonical" information in OperatorEntry. This only prints out // *non-derived* information including kernels registered to alias dispatch keys; // i.e., what the source of truth says about the operator. This dumping function // is appropriate for expect tests. // This WON'T report backend fallbacks. std::string OperatorEntry::dumpState() const { std::ostringstream oss; oss << "name: " << name_ << "\n"; if (schema_) { oss << "schema: " << schema_->schema << "\n"; oss << "debug: " << schema_->debug << "\n"; oss << "alias analysis kind: " << toString(schema_->schema.aliasAnalysis()) << (schema_->schema.isDefaultAliasAnalysisKind() ? " (default)" : "") << "\n"; } else { oss << "schema: (none)\n"; } auto print_kernel = [&](const char* k_desc, const AnnotatedKernelContainer& jts, bool is_alias_key=false) { int64_t i = 0; for (const auto& jt : jts) { oss << k_desc << (is_alias_key ? "[alias]" : "") << (i > 0 ? " (inactive)" : "") << ": " << jt.debug << " :: " << (jt.inferred_function_schema ? toString(*jt.inferred_function_schema) : "(none)") << " [ " << jt.kernel.dumpState() << "]\n"; i++; } }; // Iterate over DispatchKey, not the flat hash map, so we have a stable order for (uint8_t i = 0; i <= static_cast(DispatchKey::EndOfAliasKeys); i++) { auto k = static_cast(i); auto it = kernels_.find(k); if (it != kernels_.end()) { print_kernel(toString(k), it->second, c10::isAliasDispatchKey(k)); } } return oss.str(); } } }