- #pragma once
- #include <c10/macros/Export.h>
- #include <cstdint>
- namespace at::cuda { // declarations only; the definitions are not part of this header
- // Enqueues a kernel that spins for `cycles` cycles. NOTE(review): the target stream/device, and whether the host blocks, are not visible here; confirm in the definition.
- TORCH_CUDA_CU_API void sleep(int64_t cycles);
- // Flushes the instruction cache on ROCm; does nothing (no-op) on CUDA.
- TORCH_CUDA_CU_API void flush_icache();
- } // namespace at::cuda
|