Advertisement
Guest User

safasf

a guest
Apr 25th, 2018
60
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
C++ 0.53 KB | None | 0 0
  /**
   * Adds one term per thread into result[i].
   *
   * Launch layout: 2D. The x dimension selects the output index
   *   i = blockDim.x * blockIdx.x + threadIdx.x
   * and the y dimension selects the term index
   *   j = blockDim.y * blockIdx.y + threadIdx.y.
   *
   * For 0 < i < resultSize - 1 and start <= j <= end, where
   *   start = (i >= size) ? (i % size) + 1 : 0
   *   end   = (i + 1) / 2
   * the thread adds
   *   (A[j] + A[i - j]) * (B[j] + B[i - j]) - (D[j] + D[i - j])
   * to result[i]. The existing contents of result are kept and accumulated
   * onto; result[0] and result[resultSize - 1] are never touched.
   *
   * Every thread that shares the same i targets the same result[i], so the
   * accumulation uses atomicAdd. This requires TYPE to be a type for which
   * CUDA provides an atomicAdd overload (e.g. int, unsigned int,
   * unsigned long long).
   *
   * Threads whose i falls outside the valid range exit without touching memory,
   * so the grid may be larger than the data.
   *
   * NOTE(review): for odd i the inclusive bound end = (i + 1) / 2 makes
   * j = (i - 1) / 2 and j = (i + 1) / 2 address the same index pair, so that
   * term is added twice when both lie in [start, end] - confirm this is intended.
   *
   * @param A, B, D     input arrays, read at indices j and i - j
   * @param result      output array, accumulated in place
   * @param size        modulus/threshold used to derive the first valid j
   * @param resultSize  number of elements in result
   */
  __global__ void kernel_res_nested(TYPE *A, TYPE *B, TYPE *D, TYPE *result, TYPE size, TYPE resultSize){

      const int i = blockDim.x * blockIdx.x + threadIdx.x;
      const int j = blockDim.y * blockIdx.y + threadIdx.y;

      // Only interior outputs are updated. Written as i + 1 >= resultSize so an
      // unsigned resultSize of 0 cannot wrap, and so threads past the end of
      // result never dereference it.
      if (i < 1 || i + 1 >= resultSize) {
          return;
      }

      const TYPE start = (i >= size) ? (i % size) + 1 : 0;
      const TYPE end = (i + 1) / 2;

      // Threads outside the term range contribute nothing and must not store to
      // result[i]; a plain write-back of a stale value would discard other
      // threads' contributions.
      if (j < start || j > end) {
          return;
      }

      const TYPE term = (A[j] + A[i - j]) * (B[j] + B[i - j]) - (D[j] + D[i - j]);

      // Several threads (same i, different j) update the same element concurrently.
      atomicAdd(&result[i], term);
  }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement