blob: 1da32dcc9b202eb442fcca3d8baf3955c0b79831 [file] [log] [blame]
#include <c10/core/DispatchKey.h>
#include <c10/core/DispatchKeySet.h>
#include <unordered_map>
namespace c10 {
// Returns the printable name of a BackendComponent bit.
// Each listed enumerator maps to its own identifier spelled as a string;
// any other value yields "UNKNOWN_BACKEND_BIT".
const char* toString(BackendComponent t) {
// The printed name is exactly the enumerator identifier, so one stringifying
// macro keeps every case label and its text in lockstep.
#define BACKEND_BIT_CASE(bit) \
  case BackendComponent::bit: \
    return #bit;
  switch (t) {
    BACKEND_BIT_CASE(CPUBit)
    BACKEND_BIT_CASE(CUDABit)
    BACKEND_BIT_CASE(HIPBit)
    BACKEND_BIT_CASE(XLABit)
    BACKEND_BIT_CASE(LazyBit)
    BACKEND_BIT_CASE(MetaBit)
    BACKEND_BIT_CASE(XPUBit)
    BACKEND_BIT_CASE(IPUBit)
    BACKEND_BIT_CASE(MPSBit)
    BACKEND_BIT_CASE(HPUBit)
    BACKEND_BIT_CASE(VEBit)
    BACKEND_BIT_CASE(PrivateUse1Bit)
    BACKEND_BIT_CASE(PrivateUse2Bit)
    BACKEND_BIT_CASE(PrivateUse3Bit)
    BACKEND_BIT_CASE(InvalidBit)
    default:
      return "UNKNOWN_BACKEND_BIT";
  }
#undef BACKEND_BIT_CASE
}
// Translates a DeviceType into its BackendComponent bit by forwarding to the
// DispatchKey overload of toBackendComponent for the same-named key.
// Device types not enumerated by C10_FORALL_BACKEND_DEVICE_TYPES produce
// BackendComponent::InvalidBit.
BackendComponent toBackendComponent(DeviceType device_type) {
#define BIT_FOR_DEVICE(dev, _ignored) \
  case DeviceType::dev:               \
    return toBackendComponent(DispatchKey::dev);
  switch (device_type) {
    C10_FORALL_BACKEND_DEVICE_TYPES(BIT_FOR_DEVICE, unused)
    default:
      break;
  }
#undef BIT_FOR_DEVICE
  // No backend device type matched.
  return BackendComponent::InvalidBit;
}
// Returns the printable name of a DispatchKey.
//
// Keys listed explicitly below map to a fixed string literal. Every other key
// falls into the `default:` branch, where the name is assembled at compile
// time from the key's functionality part and its backend part (see the
// comments in that branch). The returned pointer always refers to a string
// literal.
const char* toString(DispatchKey t) {
switch (t) {
case DispatchKey::Undefined:
return "Undefined";
case DispatchKey::Dense:
return "Dense";
case DispatchKey::FPGA:
return "FPGA";
case DispatchKey::ORT:
return "ORT";
case DispatchKey::Vulkan:
return "Vulkan";
case DispatchKey::Metal:
return "Metal";
case DispatchKey::Lazy:
return "Lazy";
case DispatchKey::MPS:
return "MPS";
case DispatchKey::HPU:
return "HPU";
case DispatchKey::Quantized:
return "Quantized";
case DispatchKey::CustomRNGKeyId:
return "CustomRNGKeyId";
case DispatchKey::MkldnnCPU:
return "MkldnnCPU";
case DispatchKey::Sparse:
return "Sparse";
case DispatchKey::SparseCsrCPU:
return "SparseCsrCPU";
case DispatchKey::SparseCsrCUDA:
return "SparseCsrCUDA";
case DispatchKey::NestedTensor:
return "NestedTensor";
case DispatchKey::BackendSelect:
return "BackendSelect";
case DispatchKey::Python:
return "Python";
case DispatchKey::Fake:
return "Fake";
case DispatchKey::FuncTorchDynamicLayerBackMode:
return "FuncTorchDynamicLayerBackMode";
case DispatchKey::Functionalize:
return "Functionalize";
case DispatchKey::Named:
return "Named";
case DispatchKey::Conjugate:
return "Conjugate";
case DispatchKey::Negative:
return "Negative";
case DispatchKey::ZeroTensor:
return "ZeroTensor";
case DispatchKey::ADInplaceOrView:
return "ADInplaceOrView";
case DispatchKey::AutogradOther:
return "AutogradOther";
case DispatchKey::AutogradFunctionality:
return "AutogradFunctionality";
case DispatchKey::AutogradNestedTensor:
return "AutogradNestedTensor";
case DispatchKey::Tracer:
return "Tracer";
case DispatchKey::AutocastCPU:
return "AutocastCPU";
case DispatchKey::AutocastXPU:
return "AutocastXPU";
case DispatchKey::AutocastCUDA:
return "AutocastCUDA";
case DispatchKey::FuncTorchBatched:
return "FuncTorchBatched";
case DispatchKey::FuncTorchVmapMode:
return "FuncTorchVmapMode";
case DispatchKey::Batched:
return "Batched";
case DispatchKey::VmapMode:
return "VmapMode";
case DispatchKey::FuncTorchGradWrapper:
return "FuncTorchGradWrapper";
case DispatchKey::DeferredInit:
return "DeferredInit";
case DispatchKey::PythonTLSSnapshot:
return "PythonTLSSnapshot";
// Note [Out-of-tree vmap+grad prototype]
// The following keys are used in the implementation of the out-of-tree
// composable functions transforms (vmap+grad) prototype that lives at
// https://github.com/zou3519/functorch
// We plan on eventually upstreaming the prototype into core, at which
// point it will have a different design that should use fewer keys.
case DispatchKey::FuncTorchDynamicLayerFrontMode:
return "FuncTorchDynamicLayerFrontMode";
case DispatchKey::TESTING_ONLY_GenericWrapper:
return "TESTING_ONLY_GenericWrapper";
case DispatchKey::TESTING_ONLY_GenericMode:
return "TESTING_ONLY_GenericMode";
case DispatchKey::PythonDispatcher:
return "PythonDispatcher";
// Aliases
case DispatchKey::Autograd:
return "Autograd";
case DispatchKey::CompositeImplicitAutograd:
return "CompositeImplicitAutograd";
case DispatchKey::CompositeImplicitAutogradNestedTensor:
return "CompositeImplicitAutogradNestedTensor";
case DispatchKey::CompositeExplicitAutograd:
return "CompositeExplicitAutograd";
case DispatchKey::CompositeExplicitAutogradNonFunctional:
return "CompositeExplicitAutogradNonFunctional";
// Per-backend dispatch keys
default:
// Split the key into its backend component (bc) and its functionality key
// (fk). The outer switch below selects on fk, the inner switches on bc.
auto bc = toBackendComponent(t);
auto fk = toFunctionalityKey(t);
switch (fk) {
// ENTRY emits one inner-switch case for a backend bit. Its result is the
// adjacent string literals #functionality and #backend, which the compiler
// concatenates into a single name (functionality text first, then backend).
#define ENTRY(backend, functionality) \
case BackendComponent::backend##Bit: \
return #functionality #backend;
// FORALL_BC emits one outer-switch case for the functionality key `dkname`,
// containing an inner switch over bc. A backend component with no ENTRY case
// yields the prefix followed by "Unknown".
// NOTE(review): C10_FORALL_BACKEND_COMPONENTS and
// C10_FORALL_FUNCTIONALITY_KEYS are defined outside this file; from their use
// here they are expected to invoke the supplied macro once per list entry,
// passing the extra argument through - confirm against their definitions.
#define FORALL_BC(dkname, prefix) \
case DispatchKey::dkname: \
switch (bc) { \
C10_FORALL_BACKEND_COMPONENTS(ENTRY, prefix) \
default: \
return #prefix "Unknown"; \
}
C10_FORALL_FUNCTIONALITY_KEYS(FORALL_BC)
// Functionality key not produced by the list above: the name is built with
// the literal functionality text "Unknown" instead.
default:
switch (bc) {
C10_FORALL_BACKEND_COMPONENTS(ENTRY, Unknown)
// Neither the functionality nor the backend component was recognized.
default:
return "UnknownUnknown";
}
#undef FORALL_BC
#undef ENTRY
}
}
}
// Streams the textual name of a DispatchKey, as produced by toString.
std::ostream& operator<<(std::ostream& str, DispatchKey rhs) {
  const char* const key_name = toString(rhs);
  str << key_name;
  return str;
}
// Streams the textual name of a BackendComponent, as produced by toString.
std::ostream& operator<<(std::ostream& str, BackendComponent rhs) {
  const char* const bit_name = toString(rhs);
  str << bit_name;
  return str;
}
// Returns the autograd dispatch key associated with backend component `k`.
DispatchKey getAutogradKeyFromBackend(BackendComponent k) {
  // The backend -> autograd mapping is owned by
  // `getAutogradRelatedKeySetFromBackend` rather than this function for
  // performance reasons: that function is on a hot path and must not build
  // any DispatchKeySets at runtime. It returns the autograd key together with
  // ADInplaceOrView.
  auto autograd_related = getAutogradRelatedKeySetFromBackend(k);
  // The autograd key has higher precedence than ADInplaceOrView, so asking
  // for the highest-priority key of that set gives the autograd key we want.
  return autograd_related.highestPriorityTypeId();
}
// Parses the textual name of a dispatch key into the matching DispatchKey.
//
// @param k  Exact, case-sensitive key name (e.g. "CPU", "AutogradCUDA").
// @return   The DispatchKey registered under that name in the table below.
//
// If `k` is not present in the table, the TORCH_CHECK below fails with the
// message "could not parse dispatch key: <k>".
c10::DispatchKey parseDispatchKey(const std::string& k) {
  // The table is read-only after construction, so it is declared const; this
  // rules out accidental mutation of the shared function-local static.
  // Every name appears exactly once.
  static const std::unordered_map<std::string, c10::DispatchKey> key_map = {
      {"Undefined", c10::DispatchKey::Undefined},
      {"Dense", c10::DispatchKey::Dense},
      {"FPGA", c10::DispatchKey::FPGA},
      {"ORT", c10::DispatchKey::ORT},
      {"MPS", c10::DispatchKey::MPS},
      {"Vulkan", c10::DispatchKey::Vulkan},
      {"Metal", c10::DispatchKey::Metal},
      {"VE", c10::DispatchKey::VE},
      {"Meta", c10::DispatchKey::Meta},
      {"Quantized", c10::DispatchKey::Quantized},
      {"CustomRNGKeyId", c10::DispatchKey::CustomRNGKeyId},
      {"MkldnnCPU", c10::DispatchKey::MkldnnCPU},
      {"Sparse", c10::DispatchKey::Sparse},
      {"SparseCsrCPU", c10::DispatchKey::SparseCsrCPU},
      {"SparseCsrCUDA", c10::DispatchKey::SparseCsrCUDA},
      {"BackendSelect", c10::DispatchKey::BackendSelect},
      {"Python", c10::DispatchKey::Python},
      {"PythonTLSSnapshot", c10::DispatchKey::PythonTLSSnapshot},
      {"Fake", c10::DispatchKey::Fake},
      {"Named", c10::DispatchKey::Named},
      {"Conjugate", c10::DispatchKey::Conjugate},
      {"Negative", c10::DispatchKey::Negative},
      {"ZeroTensor", c10::DispatchKey::ZeroTensor},
      {"FuncTorchDynamicLayerBackMode",
       c10::DispatchKey::FuncTorchDynamicLayerBackMode},
      {"Functionalize", c10::DispatchKey::Functionalize},
      {"ADInplaceOrView", c10::DispatchKey::ADInplaceOrView},
      {"AutogradOther", c10::DispatchKey::AutogradOther},
      {"AutogradFunctionality", c10::DispatchKey::AutogradFunctionality},
      {"AutogradNestedTensor", c10::DispatchKey::AutogradNestedTensor},
      {"Tracer", c10::DispatchKey::Tracer},
      {"AutocastCPU", c10::DispatchKey::AutocastCPU},
      {"AutocastXPU", c10::DispatchKey::AutocastXPU},
      {"AutocastCUDA", c10::DispatchKey::AutocastCUDA},
      {"FuncTorchBatched", c10::DispatchKey::FuncTorchBatched},
      {"FuncTorchVmapMode", c10::DispatchKey::FuncTorchVmapMode},
      {"Batched", c10::DispatchKey::Batched},
      {"VmapMode", c10::DispatchKey::VmapMode},
      {"DeferredInit", c10::DispatchKey::DeferredInit},
      {"FuncTorchGradWrapper", c10::DispatchKey::FuncTorchGradWrapper},
      {"FuncTorchDynamicLayerFrontMode",
       c10::DispatchKey::FuncTorchDynamicLayerFrontMode},
      {"TESTING_ONLY_GenericWrapper",
       c10::DispatchKey::TESTING_ONLY_GenericWrapper},
      {"TESTING_ONLY_GenericMode", c10::DispatchKey::TESTING_ONLY_GenericMode},
      {"PythonDispatcher", c10::DispatchKey::PythonDispatcher},

      // Per-backend keys.
      {"CPU", c10::DispatchKey::CPU},
      {"CUDA", c10::DispatchKey::CUDA},
      {"HIP", c10::DispatchKey::HIP},
      {"XLA", c10::DispatchKey::XLA},
      {"XPU", c10::DispatchKey::XPU},
      {"IPU", c10::DispatchKey::IPU},
      {"HPU", c10::DispatchKey::HPU},
      {"Lazy", c10::DispatchKey::Lazy},
      {"NestedTensor", c10::DispatchKey::NestedTensor},
      {"NestedTensorCPU", c10::DispatchKey::NestedTensorCPU},
      {"NestedTensorCUDA", c10::DispatchKey::NestedTensorCUDA},
      {"PrivateUse1", c10::DispatchKey::PrivateUse1},
      {"PrivateUse2", c10::DispatchKey::PrivateUse2},
      {"PrivateUse3", c10::DispatchKey::PrivateUse3},

      {"QuantizedCPU", c10::DispatchKey::QuantizedCPU},
      {"QuantizedCUDA", c10::DispatchKey::QuantizedCUDA},
      {"QuantizedXPU", c10::DispatchKey::QuantizedXPU},

      {"SparseCPU", c10::DispatchKey::SparseCPU},
      {"SparseCUDA", c10::DispatchKey::SparseCUDA},
      {"SparseHIP", c10::DispatchKey::SparseHIP},
      {"SparseXPU", c10::DispatchKey::SparseXPU},
      {"SparseVE", c10::DispatchKey::SparseVE},

      {"AutogradCPU", c10::DispatchKey::AutogradCPU},
      {"AutogradCUDA", c10::DispatchKey::AutogradCUDA},
      {"AutogradXLA", c10::DispatchKey::AutogradXLA},
      {"AutogradLazy", c10::DispatchKey::AutogradLazy},
      {"AutogradMeta", c10::DispatchKey::AutogradMeta},
      {"AutogradIPU", c10::DispatchKey::AutogradIPU},
      {"AutogradXPU", c10::DispatchKey::AutogradXPU},
      {"AutogradMPS", c10::DispatchKey::AutogradMPS},
      {"AutogradHPU", c10::DispatchKey::AutogradHPU},
      {"AutogradPrivateUse1", c10::DispatchKey::AutogradPrivateUse1},
      {"AutogradPrivateUse2", c10::DispatchKey::AutogradPrivateUse2},
      {"AutogradPrivateUse3", c10::DispatchKey::AutogradPrivateUse3},

      // Alias keys.
      {"Autograd", c10::DispatchKey::Autograd},
      {"CompositeImplicitAutograd",
       c10::DispatchKey::CompositeImplicitAutograd},
      {"CompositeImplicitAutogradNestedTensor",
       c10::DispatchKey::CompositeImplicitAutogradNestedTensor},
      {"CompositeExplicitAutograd",
       c10::DispatchKey::CompositeExplicitAutograd},
      {"CompositeExplicitAutogradNonFunctional",
       c10::DispatchKey::CompositeExplicitAutogradNonFunctional},
  };
  const auto it = key_map.find(k);
  TORCH_CHECK(it != key_map.end(), "could not parse dispatch key: ", k);
  return it->second;
}
} // namespace c10