14 lines
319 B
C
14 lines
319 B
C
|
#pragma once
|
||
|
#include <c10/macros/Export.h>
|
||
|
#include <cstdint>
|
||
|
|
||
|
// Public declarations of two small GPU utility entry points. Only the
// prototypes live in this header; the definitions are not visible here.
// NOTE(review): TORCH_CUDA_CU_API is presumably the symbol export/visibility
// macro supplied by <c10/macros/Export.h> (included above) -- confirm.
namespace at::cuda {
|
||
|
|
||
|
// Enqueues a kernel that spins for the specified number of cycles.
//
// Parameters:
//   cycles - number of cycles the enqueued kernel should spin for, passed as
//            a signed 64-bit integer (int64_t from <cstdint>).
//
// Returns nothing.
//
// NOTE(review): this header does not show which stream the kernel is enqueued
// on, whether the call returns before the spin finishes, or how zero/negative
// `cycles` values are treated -- confirm against the definition before relying
// on any of these.
|
||
|
TORCH_CUDA_CU_API void sleep(int64_t cycles);
|
||
|
|
||
|
// Flushes the instruction cache on ROCm builds; on CUDA builds this is a
// no-op.
//
// Takes no arguments and returns nothing.
//
// NOTE(review): the scope of the flush (which device(s), and whether the call
// synchronizes with in-flight work) is not visible from this header -- confirm
// against the definition.
|
||
|
TORCH_CUDA_CU_API void flush_icache();
|
||
|
|
||
|
} // namespace at::cuda
|