mirror of
				https://github.com/stevenrobertson/cuburn.git
				synced 2025-11-04 02:10:45 -05:00 
			
		
		
		
	Add an important comment
This commit is contained in:
		@ -190,8 +190,11 @@ iter(uint64_t out_ptr, uint64_t atom_ptr,
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
{{if not chaos_used}}
 | 
					{{if not chaos_used}}
 | 
				
			||||||
    // Shared memory size can be reduced by a factor of four using a slower
 | 
					    // Shared memory size can be reduced by a factor of four using a slower
 | 
				
			||||||
    // 4-stage reduce, but on Fermi hardware shmem use isn't a bottleneck
 | 
					    // 4-stage reduce, but on Fermi hardware shmem use isn't a bottleneck.
 | 
				
			||||||
    __shared__ float swap[{{4*NTHREADS}}];
 | 
					    __shared__ float swap[{{4*NTHREADS}}];
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    // Cooperative branch selection, used for deciding when all threads in a
 | 
				
			||||||
 | 
					    // warp should share a branch.
 | 
				
			||||||
    __shared__ float cosel[{{2*NWARPS}}];
 | 
					    __shared__ float cosel[{{2*NWARPS}}];
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    // This is normally done after the swap-sync in the main loop
 | 
					    // This is normally done after the swap-sync in the main loop
 | 
				
			||||||
 | 
				
			|||||||
		Reference in New Issue
	
	Block a user