Guest User

Untitled

a guest
Dec 18th, 2014
185
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 3.05 KB | None | 0 0
  1. // ***********************************************************************
  2. //
  3. // Demo program for education in subject
  4. // Computer Architectures and Parallel Systems.
  5. // Petr Olivka, dep. of Computer Science, FEI, VSB-TU Ostrava
  6. //
  7. // Example of CUDA Technology Usage.
  8. // Manipulation with prepared image.
  9. //
  10. // ***********************************************************************
  11.  
  12. #include <cuda_runtime.h>
  13. #include <stdio.h>
  14.  
  // Every thread identifies its pixel from its position in the grid and in the
  // block, and paints that pixel with a fixed four-triangle pattern.
  //
  // Launch layout: 2D grid of 2D blocks, one thread per pixel. The grid may be
  // rounded up past the image size; threads outside the image exit immediately.
  // No shared memory is used.
  //
  //   pic   - image buffer of sizex * sizey pixels, addressed row by row as
  //           pic[ y * sizex + x ]; every pixel is overwritten
  //   sizex - image width in pixels
  //   sizey - image height in pixels
  //
  // The previous pixel content is not read: the background colour below is
  // assigned unconditionally, so the pattern replaces the whole image.
  __global__ void kernel_animation( uchar4 *pic, int sizex, int sizey )
  {
      // X,Y coordinates of the pixel handled by this thread
      int y = blockDim.y * blockIdx.y + threadIdx.y;
      int x = blockDim.x * blockIdx.x + threadIdx.x;
      if ( x >= sizex || y >= sizey ) return;

      // Background colour. The original comment calls it yellow, which holds when
      // .x is the red channel; with a BGR host image it would be cyan.
      // NOTE(review): confirm the channel order used by the caller.
      uchar4 bgr = { 255, 255, 0, 0 };

      // The tests below run in this order on purpose: where regions overlap,
      // the later (black) assignment wins over the earlier (green) one.

      // Triangle pointing down (lower half of the image)
      if ( ( x + y ) <= sizex + sizex / 2 && ( x + ( sizex / 2 ) >= y ) && y > sizey / 2 )
      {
          bgr.x = bgr.z = 0; // green
      }

      // Triangle pointing up (upper half of the image)
      if ( ( x + y >= sizex / 2 ) && ( x - ( sizex / 2 ) <= y ) && y < sizey / 2 )
      {
          bgr.x = bgr.z = 0; // green
      }

      // Triangle pointing right (right half of the image)
      if ( ( x - ( sizex / 2 ) <= y ) && ( x + y ) <= sizex + sizex / 2 && x > sizex / 2 )
      {
          bgr.x = bgr.y = bgr.z = 0; // black
      }

      // Triangle pointing left (left half of the image, including the middle column)
      if ( ( x + y >= sizex / 2 ) && ( x + ( sizex / 2 ) >= y ) && x <= sizex / 2 )
      {
          bgr.x = bgr.y = bgr.z = 0; // black
      }

      // Store the final colour of point [x,y] back to the image.
      // The index is computed in size_t so that y * sizex cannot overflow int.
      pic[ (size_t) y * sizex + x ] = bgr;
  }
  72.  
  // Prints a CUDA error in the file's usual format and reports whether the call
  // succeeded. 'line' is the source line of the checked call.
  static bool report_cuda_error( cudaError_t cerr, int line )
  {
      if ( cerr == cudaSuccess ) return true;
      printf( "CUDA Error [%d] - '%s'\n", line, cudaGetErrorString( cerr ) );
      return false;
  }

  // Runs kernel_animation over a host image: allocates a device buffer, copies
  // the image in, launches the kernel and copies the result back into 'pic'.
  //
  //   pic            - host image buffer of sizex * sizey pixels (read and overwritten)
  //   sizex, sizey   - image width and height in pixels, must be positive
  //   blockx, blocky - thread block dimensions, must be positive
  //
  // On any failure the error is printed, the remaining steps are skipped and the
  // device buffer is still released; 'pic' is only modified by a successful
  // device-to-host copy.
  void run_animation( uchar4 *pic, int sizex, int sizey, int blockx, int blocky )
  {
      // Reject arguments that would divide by zero in the grid computation
      // or describe an empty/invalid image.
      if ( pic == NULL || sizex <= 0 || sizey <= 0 || blockx <= 0 || blocky <= 0 )
      {
          printf( "run_animation: invalid arguments (size %dx%d, block %dx%d)\n",
                  sizex, sizey, blockx, blocky );
          return;
      }

      // Byte count computed in size_t so sizex * sizey cannot overflow int
      const size_t bytes = (size_t) sizex * (size_t) sizey * sizeof( uchar4 );

      // Memory allocation in GPU device
      uchar4 *cudaPic = NULL;
      if ( !report_cuda_error( cudaMalloc( &cudaPic, bytes ), __LINE__ ) )
          return; // nothing was allocated, nothing to free

      // Copy data to GPU device
      if ( report_cuda_error( cudaMemcpy( cudaPic, pic, bytes, cudaMemcpyHostToDevice ), __LINE__ ) )
      {
          // Grid creation with computed organization (rounded up to cover the image)
          dim3 mrizka( ( sizex + blockx - 1 ) / blockx, ( sizey + blocky - 1 ) / blocky );
          kernel_animation<<< mrizka, dim3( blockx, blocky ) >>>( cudaPic, sizex, sizey );

          // Launch-configuration errors show up here; only copy back if the launch was accepted.
          // The blocking copy below also waits for the kernel and reports its execution errors.
          if ( report_cuda_error( cudaGetLastError(), __LINE__ ) )
          {
              // Copy data from GPU device to PC
              report_cuda_error( cudaMemcpy( pic, cudaPic, bytes, cudaMemcpyDeviceToHost ), __LINE__ );
          }
      }

      // Free memory on every path once the allocation has succeeded
      report_cuda_error( cudaFree( cudaPic ), __LINE__ );
  }
Advertisement
Add Comment
Please, Sign In to add comment