#ifndef __RUNTIME_IMPL__ #define __RUNTIME_IMPL__ #include "cudaStatus.h" #include "structures.h" cudaError_t cudaDeviceReset(void); cudaError_t cudaDeviceSynchronize(void); cudaError_t cudaFree(void *devPtr); cudaError_t cudaLaunchKernel(const void *func, dim3 gridDim, dim3 blockDim, void **args, size_t sharedMem, cudaStream_t stream); cudaError_t cudaMalloc(void **devPtr, size_t size); cudaError_t cudaMemcpy(void *dst, const void *src, size_t count, cudaMemcpyKind kind); cudaError_t cudaSetDevice(int device); cudaError_t cudaStreamCopyAttributes(cudaStream_t dst, cudaStream_t src); cudaError_t cudaStreamCreate(cudaStream_t *pStream); cudaError_t cudaStreamDestroy(cudaStream_t stream); cudaError_t cudaStreamSynchronize(cudaStream_t stream); #endif