Skip to content

Commit

Permalink
BSLab: new profile.txt with NUM_THREADS = 4*WARP_SIZE for mtf_cuda_thread[by4]
Browse files Browse the repository at this point in the history
  • Loading branch information
Bulat-Ziganshin committed Jun 18, 2016
1 parent 6b1236d commit d28523d
Show file tree
Hide file tree
Showing 3 changed files with 3,669 additions and 6,392 deletions.
2 changes: 1 addition & 1 deletion app_bslab/bslab.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -350,7 +350,7 @@ int main (int argc, char **argv)
time_run ("mtf_cuda_thread ", [&] {mtf_cuda_thread <CHUNK> <<<(inbytes-1)/(CHUNK*WARP_SIZE)+1, WARP_SIZE>>> (d_inbuf, d_outbuf, inbytes, CHUNK);});
time_run ("mtf_cuda_thread_by4 ", [&] {mtf_cuda_thread_by4<CHUNK> <<<(inbytes-1)/(CHUNK*WARP_SIZE)+1, WARP_SIZE>>> (d_inbuf, d_outbuf, inbytes, CHUNK);});

- const int NUM_THREADS = 1*WARP_SIZE;
+ const int NUM_THREADS = 4*WARP_SIZE;
time_run ("mtf_cuda_thread<8> ", [&] {mtf_cuda_thread <CHUNK,NUM_THREADS,8> <<<(inbytes-1)/(CHUNK*NUM_THREADS)+1, NUM_THREADS>>> (d_inbuf, d_outbuf, inbytes, CHUNK);});
time_run ("mtf_cuda_thread<16> ", [&] {mtf_cuda_thread <CHUNK,NUM_THREADS,16> <<<(inbytes-1)/(CHUNK*NUM_THREADS)+1, NUM_THREADS>>> (d_inbuf, d_outbuf, inbytes, CHUNK);});
time_run ("mtf_cuda_thread<32> ", [&] {mtf_cuda_thread <CHUNK,NUM_THREADS,32> <<<(inbytes-1)/(CHUNK*NUM_THREADS)+1, NUM_THREADS>>> (d_inbuf, d_outbuf, inbytes, CHUNK);});
Expand Down
Loading

0 comments on commit d28523d

Please sign in to comment.