namespace at::cuda { | |
// enqueues a kernel that spins for the specified number of cycles | |
TORCH_CUDA_CU_API void sleep(int64_t cycles); | |
// flushes instruction cache for ROCm; no-op for CUDA | |
TORCH_CUDA_CU_API void flush_icache(); | |
} // namespace at::cuda | |