mirror of
https://github.com/stevenrobertson/cuburn.git
synced 2025-02-05 11:40:04 -05:00
Add an important comment
This commit is contained in:
parent
6aac026a6b
commit
6938ac715b
@@ -190,8 +190,11 @@ iter(uint64_t out_ptr, uint64_t atom_ptr,
|
||||
|
||||
{{if not chaos_used}}
|
||||
// Shared memory size can be reduced by a factor of four using a slower
|
||||
// 4-stage reduce, but on Fermi hardware shmem use isn't a bottleneck
|
||||
// 4-stage reduce, but on Fermi hardware shmem use isn't a bottleneck.
|
||||
__shared__ float swap[{{4*NTHREADS}}];
|
||||
|
||||
// Cooperative branch selection, used for deciding when all threads in a
|
||||
// warp should share a branch.
|
||||
__shared__ float cosel[{{2*NWARPS}}];
|
||||
|
||||
// This is normally done after the swap-sync in the main loop
|
||||
|
Loading…
Reference in New Issue
Block a user