From 6938ac715b9d4b48662f6552894427fd5e07cf4c Mon Sep 17 00:00:00 2001 From: Steven Robertson Date: Sun, 6 Jan 2013 21:58:14 -0800 Subject: [PATCH] Add an important comment --- cuburn/code/iter.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/cuburn/code/iter.py b/cuburn/code/iter.py index d9b5477..df3085b 100644 --- a/cuburn/code/iter.py +++ b/cuburn/code/iter.py @@ -190,8 +190,11 @@ iter(uint64_t out_ptr, uint64_t atom_ptr, {{if not chaos_used}} // Shared memory size can be reduced by a factor of four using a slower - // 4-stage reduce, but on Fermi hardware shmem use isn't a bottleneck + // 4-stage reduce, but on Fermi hardware shmem use isn't a bottleneck. __shared__ float swap[{{4*NTHREADS}}]; + + // Cooperative branch selection, used for deciding when all threads in a + // warp should share a branch. __shared__ float cosel[{{2*NWARPS}}]; // This is normally done after the swap-sync in the main loop