diff --git a/cuburn/code/output.py b/cuburn/code/output.py index 611b4b0..9126e30 100644 --- a/cuburn/code/output.py +++ b/cuburn/code/output.py @@ -29,6 +29,6 @@ __global__ void f32_to_u8( int idst = dstride * y + x; dst[idst] = out; - rctxs[rb_incr(rb->head, tid)] = rctx; + rctxs[rb_incr(rb->tail, tid)] = rctx; } ''')