Add new Hello World in CUDA 🚀

http://computer-graphics.se/hello-world-for-cuda.html Parallel Programming version!
Aniket965 · Oct 7, 2018 · 8a8332f · 8a8332f
1 parent b5fcf7f
commit 8a8332f
Showing 1 changed file with 47 additions and 0 deletions.
diff --git a/CUDA/HelloWorld.cu b/CUDA/HelloWorld.cu
@@ -0,0 +1,47 @@
+// This is the REAL "hello world" for CUDA!
+// It takes the string "Hello ", prints it, then passes it to CUDA
+// with an array of offsets. Then the offsets are added in parallel
+// to produce the string "World!"
+// By Ingemar Ragnemalm 2010
+
+// Build: nvcc HelloWorld.cu -L /usr/local/cuda/lib -lcudart -o hello-world
+
+#include <stdio.h>
+#include <stdlib.h>
+
+// Element count of the character array and of the offset array built in main().
+static const int N = 16;
+// Number of threads in the single block that main() launches.
+static const int blocksize = 16;
+
+// Adds the integer offset b[i] to the character a[i], one element per thread.
+//
+// Parameters:
+//   a - device pointer to at least N characters; modified in place.
+//   b - device pointer to at least N integer offsets; only read.
+//
+// Launch layout: 1D grid of 1D blocks. Any configuration is safe: threads
+// whose global index falls outside [0, N) do nothing. No shared memory is used.
+__global__
+void hello(char *a, int *b)
+{
+	// Flat global index so that a multi-block launch still maps each thread
+	// to a distinct element instead of re-applying offsets per block.
+	const int i = blockIdx.x * blockDim.x + threadIdx.x;
+
+	// Guard against launches with more threads than array elements.
+	if (i < N)
+		a[i] += b[i];
+}
+
+// Reports a failed CUDA runtime call on stderr.
+// Returns true when status is cudaSuccess, false otherwise.
+static bool cudaOk(cudaError_t status, const char *what)
+{
+	if (status == cudaSuccess)
+		return true;
+	fprintf(stderr, "CUDA error during %s: %s\n", what, cudaGetErrorString(status));
+	return false;
+}
+
+// Prints "Hello ", lets the GPU add per-character offsets to that string,
+// then prints the result ("World!").
+// Returns EXIT_SUCCESS on success, EXIT_FAILURE if any CUDA call fails.
+int main()
+{
+	char a[N] = "Hello \0\0\0\0\0\0";
+	int b[N] = {15, 10, 6, 0, -11, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0};
+
+	// Device copies of a and b; initialised to null so the cleanup below is
+	// valid even when an allocation never happened.
+	char *ad = NULL;
+	int *bd = NULL;
+	const size_t csize = N * sizeof(char);
+	const size_t isize = N * sizeof(int);
+
+	printf("%s", a);
+
+	// Short-circuit evaluation stops at the first failing call.
+	bool ok = cudaOk(cudaMalloc((void**)&ad, csize), "cudaMalloc(ad)")
+		&& cudaOk(cudaMalloc((void**)&bd, isize), "cudaMalloc(bd)")
+		&& cudaOk(cudaMemcpy(ad, a, csize, cudaMemcpyHostToDevice), "copy of a to device")
+		&& cudaOk(cudaMemcpy(bd, b, isize, cudaMemcpyHostToDevice), "copy of b to device");
+
+	if (ok) {
+		dim3 dimBlock( blocksize, 1 );
+		dim3 dimGrid( 1, 1 );
+		hello<<<dimGrid, dimBlock>>>(ad, bd);
+
+		// A launch returns no status; configuration errors are picked up by
+		// cudaGetLastError(), and the blocking copy back waits for the
+		// kernel and reports any error raised while it ran.
+		ok = cudaOk(cudaGetLastError(), "kernel launch")
+			&& cudaOk(cudaMemcpy(a, ad, csize, cudaMemcpyDeviceToHost), "copy of a to host");
+	}
+
+	// cudaFree on a null pointer performs no operation, so this is safe on
+	// every path.
+	cudaFree( ad );
+	cudaFree( bd );
+
+	if (!ok) {
+		// Terminate the partial "Hello " line before exiting.
+		printf("\n");
+		return EXIT_FAILURE;
+	}
+
+	printf("%s\n", a);
+	return EXIT_SUCCESS;
+}