mirror of
https://github.com/stevenrobertson/cuburn.git
synced 2025-02-05 11:40:04 -05:00
Remove outdated MemBench stuff
This commit is contained in:
parent
94c453d153
commit
6f3c27007a
@ -240,49 +240,3 @@ def render(features, cps):
|
||||
abuf = cuda.from_device_like(obufd, abuf)
|
||||
return abuf, dbuf
|
||||
|
||||
|
||||
|
||||
# TODO: find a better place to stick this code
|
||||
class MemBench(HunkOCode):
|
||||
decls = """
|
||||
__shared__ uint32_t coord[512];
|
||||
"""
|
||||
|
||||
defs_tmpl = Template("""
|
||||
__global__
|
||||
void iter{{W}}(mwc_st *mwcs, uint32_t *buf) {
|
||||
mwc_st rctx = mwcs[gtid()];
|
||||
|
||||
int mask = (1 << {{W}}) - 1;
|
||||
int smoff = threadIdx.x >> {{W}};
|
||||
int writer = (threadIdx.x & mask) == 0;
|
||||
|
||||
for (int i = 0; i < 1024 * 32; i++) {
|
||||
if (writer)
|
||||
coord[smoff] = mwc_next(&rctx) & 0x7ffffff; // 512MB / 4 bytes
|
||||
__syncthreads();
|
||||
uint32_t *dst = buf + (coord[smoff] + (threadIdx.x & mask));
|
||||
uint32_t val = mwc_next(&rctx);
|
||||
asm("st.global.u32 [%0], %1;" :: "l"(dst), "r"(val));
|
||||
}
|
||||
}
|
||||
""")
|
||||
|
||||
@property
|
||||
def defs(self):
|
||||
return '\n'.join([self.defs_tmpl.substitute(W=w) for w in range(8)])
|
||||
|
||||
def membench():
|
||||
code = assemble_code(BaseCode, mwc.MWC, MemBench())
|
||||
mod = SourceModule(code)
|
||||
|
||||
buf = cuda.mem_alloc(512 << 20)
|
||||
seeds = mwc.MWC.make_seeds(512 * 21)
|
||||
|
||||
for w in range(8):
|
||||
fun = mod.get_function('iter%d' % w)
|
||||
print 'Launching with W=%d' % w
|
||||
t = fun(cuda.In(seeds), buf,
|
||||
block=(512, 1, 1), grid=(21, 1), time_kernel=True)
|
||||
print 'Completed in %g' % t
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user