// Using different memory spaces in CUDA.

#include <cstdio>
#include <cstdlib>

// Evaluates a CUDA runtime call and aborts with file/line and the runtime's
// error string if it did not return cudaSuccess.
#define CUDA_CHECK(call)                                                   \
    do {                                                                   \
        cudaError_t cuda_check_err_ = (call);                              \
        if (cuda_check_err_ != cudaSuccess) {                              \
            fprintf(stderr, "CUDA error %s:%d: %s\n", __FILE__, __LINE__,  \
                    cudaGetErrorString(cuda_check_err_));                  \
            abort();                                                       \
        }                                                                  \
    } while (0)

// A __device__ or __global__ function runs on the GPU.
//
// Every launched thread copies its by-value argument `in` into the
// function-scope variable `f`. Nothing is written back to memory visible to
// other threads or to the host, so the kernel has no observable output.
__global__ void use_local_memory_GPU(float in) {
    float f;  // function-scope variable: each thread has its own copy
    f = in;   // `in` is passed by value, so it is also private to the thread
    (void)f;  // silence "set but never used" diagnostics
}

// Launches the kernel with 1 block of 128 threads, then allocates (and
// releases) a 128-float device buffer. Returns 0 on success; any CUDA failure
// aborts via CUDA_CHECK.
int main(int argc, char **argv) {
    (void)argc;
    (void)argv;

    // Single source of truth for the thread count and both array lengths.
    const int kNumElements = 128;

    use_local_memory_GPU<<<1, kNumElements>>>(2.0f);
    // A launch does not return a status; configuration errors are only
    // reported through cudaGetLastError().
    CUDA_CHECK(cudaGetLastError());
    // Wait for the kernel so that execution errors surface here and the
    // process does not exit while the kernel is still pending.
    CUDA_CHECK(cudaDeviceSynchronize());

    float h_arr[kNumElements];  // host-side array; not used further in this excerpt
    (void)h_arr;

    float *d_arr = NULL;  // receives the device allocation from cudaMalloc
    CUDA_CHECK(cudaMalloc((void **)&d_arr, sizeof(float) * kNumElements));

    // Release the device buffer; the original never freed it.
    CUDA_CHECK(cudaFree(d_arr));

    return 0;
}
// [image: s3://crabby-images/9d645/9d6450ec4e4fa78612b6bd430a1e444f882976be]
// [image: s3://crabby-images/8f657/8f657e2fb8d3a44950d5088dee12658d37e28759]