mirror of
https://github.com/stevenrobertson/cuburn.git
synced 2025-02-05 11:40:04 -05:00
Add an important comment
This commit is contained in:
parent
6aac026a6b
commit
6938ac715b
@ -190,8 +190,11 @@ iter(uint64_t out_ptr, uint64_t atom_ptr,
|
|||||||
|
|
||||||
{{if not chaos_used}}
|
{{if not chaos_used}}
|
||||||
// Shared memory size can be reduced by a factor of four using a slower
|
// Shared memory size can be reduced by a factor of four using a slower
|
||||||
// 4-stage reduce, but on Fermi hardware shmem use isn't a bottleneck
|
// 4-stage reduce, but on Fermi hardware shmem use isn't a bottleneck.
|
||||||
__shared__ float swap[{{4*NTHREADS}}];
|
__shared__ float swap[{{4*NTHREADS}}];
|
||||||
|
|
||||||
|
// Cooperative branch selection, used for deciding when all threads in a
|
||||||
|
// warp should share a branch.
|
||||||
__shared__ float cosel[{{2*NWARPS}}];
|
__shared__ float cosel[{{2*NWARPS}}];
|
||||||
|
|
||||||
// This is normally done after the swap-sync in the main loop
|
// This is normally done after the swap-sync in the main loop
|
||||||
|
Loading…
Reference in New Issue
Block a user