#pragma once

#include <bitset>
#include <cstddef>

namespace torch {

/// Number of bits held by `device_set` (fixed at compile time).
/// NOTE(review): presumably the maximum number of CUDA devices that can be
/// tracked, going by the name -- confirm against callers.
static constexpr std::size_t MAX_CUDA_DEVICES = 64;

/// Fixed-size bit set with `MAX_CUDA_DEVICES` bits.
/// NOTE(review): presumably bit `i` marks CUDA device index `i` as a member
/// of the set -- confirm against callers.
using device_set = std::bitset<MAX_CUDA_DEVICES>;

} // namespace torch