Make code more portable

2025-08-02 05:25:39 -04:00 · 2011-05-03 17:12:12 -04:00
parent eeff0a4d4f
commit c605815130
5 changed files with 197 additions and 168 deletions
--- a/cuburn/_pyflam3_hacks.py
+++ b/cuburn/_pyflam3_hacks.py
@ -0,0 +1,170 @@
+"""
+Fr0st's pyflam3 bindings omit the ctypes fields for the xform structure.
+This lets a given fr0st release be compatible with a much larger range
+of flam3 versions, but we need access to that data.
+
+Importing this module monkey-patches the fr0st module to include those
+fields, and also provides a few other functions not needed in fr0st.
+If flam3 or smoulder eventually includes padded xform structuress for
+wider compatibility, or I bother to write a parser for flam3.h,
+this may become unnecessary.
+"""
+
+from ctypes import *
+from fr0stlib.pyflam3 import constants
+from fr0stlib.pyflam3._flam3 import *
+
+flam3_nvariations = constants.flam3_nvariations = 99
+
+BaseXForm._fields_ = [('var', c_double * flam3_nvariations)
+               , ('c', (c_double * 2) * 3) # TODO: ctypes 2D arrays?
+               , ('post', (c_double * 2) * 3)
+               , ('density', c_double)
+               , ('color', c_double)
+               , ('color_speed', c_double)
+               , ('animate', c_double)
+               , ('opacity', c_double)
+               , ('vis_adjusted', c_double)
+               , ('padding', c_int)
+               , ('wind', c_double * 2)
+               , ('precalc_angles_flag', c_int)
+               , ('precalc_atan_xy_flag', c_int)
+               , ('precalc_atan_yx_flag', c_int)
+               , ('has_preblur', c_double)
+               , ('has_post', c_int)
+               , ('blob_low', c_double)
+               , ('blob_high', c_double)
+               , ('blob_waves', c_double)
+               , ('pdj_a', c_double)
+               , ('pdj_b', c_double)
+               , ('pdj_c', c_double)
+               , ('pdj_d', c_double)
+               , ('fan2_x', c_double)
+               , ('fan2_y', c_double)
+               , ('rings2_val', c_double)
+               , ('perspective_angle', c_double)
+               , ('perspective_dist', c_double)
+               , ('julian_power', c_double)
+               , ('julian_dist', c_double)
+               , ('juliascope_power', c_double)
+               , ('juliascope_dist', c_double)
+               , ('radial_blur_angle', c_double)
+               , ('pie_slices', c_double)
+               , ('pie_rotation', c_double)
+               , ('pie_thickness', c_double)
+               , ('ngon_sides', c_double)
+               , ('ngon_power', c_double)
+               , ('ngon_circle', c_double)
+               , ('ngon_corners', c_double)
+               , ('curl_c1', c_double)
+               , ('curl_c2', c_double)
+               , ('rectangles_x', c_double)
+               , ('rectangles_y', c_double)
+               , ('amw_amp', c_double)
+               , ('disc2_rot', c_double)
+               , ('disc2_twist', c_double)
+               , ('super_shape_rnd', c_double)
+               , ('super_shape_m', c_double)
+               , ('super_shape_n1', c_double)
+               , ('super_shape_n2', c_double)
+               , ('super_shape_n3', c_double)
+               , ('super_shape_holes', c_double)
+               , ('flower_petals', c_double)
+               , ('flower_holes', c_double)
+               , ('conic_eccentricity', c_double)
+               , ('conic_holes', c_double)
+               , ('parabola_height', c_double)
+               , ('parabola_width', c_double)
+               , ('bent2_x', c_double)
+               , ('bent2_y', c_double)
+               , ('bipolar_shift', c_double)
+               , ('cell_size', c_double)
+               , ('cpow_r', c_double)
+               , ('cpow_i', c_double)
+               , ('cpow_power', c_double)
+               , ('curve_xamp', c_double)
+               , ('curve_yamp', c_double)
+               , ('curve_xlength', c_double)
+               , ('curve_ylength', c_double)
+               , ('escher_beta', c_double)
+               , ('lazysusan_spin', c_double)
+               , ('lazysusan_space', c_double)
+               , ('lazysusan_twist', c_double)
+               , ('lazysusan_x', c_double)
+               , ('lazysusan_y', c_double)
+               , ('modulus_x', c_double)
+               , ('modulus_y', c_double)
+               , ('oscope_separation', c_double)
+               , ('oscope_frequency', c_double)
+               , ('oscope_amplitude', c_double)
+               , ('oscope_damping', c_double)
+               , ('popcorn2_x', c_double)
+               , ('popcorn2_y', c_double)
+               , ('popcorn2_c', c_double)
+               , ('separation_x', c_double)
+               , ('separation_xinside', c_double)
+               , ('separation_y', c_double)
+               , ('separation_yinside', c_double)
+               , ('split_xsize', c_double)
+               , ('split_ysize', c_double)
+               , ('splits_x', c_double)
+               , ('splits_y', c_double)
+               , ('stripes_space', c_double)
+               , ('stripes_warp', c_double)
+               , ('wedge_angle', c_double)
+               , ('wedge_hole', c_double)
+               , ('wedge_count', c_double)
+               , ('wedge_swirl', c_double)
+               , ('wedge_julia_angle', c_double)
+               , ('wedge_julia_count', c_double)
+               , ('wedge_julia_power', c_double)
+               , ('wedge_julia_dist', c_double)
+               , ('wedge_sph_angle', c_double)
+               , ('wedge_sph_count', c_double)
+               , ('wedge_sph_hole', c_double)
+               , ('wedge_sph_swirl', c_double)
+               , ('whorl_inside', c_double)
+               , ('whorl_outside', c_double)
+               , ('waves2_freqx', c_double)
+               , ('waves2_scalex', c_double)
+               , ('waves2_freqyx', c_double)
+               , ('waves2_scaley', c_double)
+               , ('auger_sym', c_double)
+               , ('auger_weight', c_double)
+               , ('auger_freq', c_double)
+               , ('auger_scale', c_double)
+               , ('flux_spread', c_double)
+               , ('mobius_re_a', c_double)
+               , ('mobius_im_a', c_double)
+               , ('mobius_re_b', c_double)
+               , ('mobius_im_b', c_double)
+               , ('mobius_re_c', c_double)
+               , ('mobius_im_c', c_double)
+               , ('persp_vsin', c_double)
+               , ('persp_vfcos', c_double)
+               , ('julian_rN', c_double)
+               , ('julian_cN', c_double)
+               , ('juliascope_rN', c_double)
+               , ('juliascope_cN', c_double)
+               , ('wedgeJulia_rN', c_double)
+               , ('wedgeJulia_cn', c_double)
+               , ('wedgeJulia_cf', c_double)
+               , ('radialBlur_spinvar', c_double)
+               , ('radialBlur_zoomvar', c_double)
+               , ('waves_dx2', c_double)
+               , ('waves_dy2', c_double)
+               , ('disc2_sinadd', c_double)
+               , ('disc2_cosadd', c_double)
+               , ('disc2_timespi', c_double)
+               , ('super_shape_pm_4', c_double)
+               , ('super_shape_pneg1_n1', c_double)
+               , ('num_active_vars', c_int)
+               , ('active_var_weights', c_double * flam3_nvariations)
+               , ('varFunc', c_int * flam3_nvariations)
+               , ('motion_freq', c_int)
+               , ('motion_func', c_int)
+               , ('motion', POINTER(BaseXForm))
+               , ('num_motion', c_int)
+               # It seems I'm missing something in the current version.
+               , ('mysterious_padding', c_double * 2) ]
+
--- a/cuburn/code/iter.py
+++ b/cuburn/code/iter.py
@ -130,7 +130,7 @@ void iter(mwc_st *msts, iter_info *infos, float *accbuf, float *denbuf) {
                packer = self.packer.view('info'))


-def silly(features, cps):
+def render(features, cps):
    nsteps = 1000
    abuf = np.zeros((1024, 1024, 4), dtype=np.float32)
    dbuf = np.zeros((1024, 1024), dtype=np.float32)
--- a/cuburn/code/variations.py
+++ b/cuburn/code/variations.py
@ -35,7 +35,7 @@ var(5, 'polar', """

 var(10, 'hyperbolic', """
    float a = atan2f(tx, ty);
-    float r = sqrt(tx*tx + ty*ty) + 1e-20;
+    float r = sqrt(tx*tx + ty*ty) + 1e-20f;
    ox += w * sinf(a) / r;
    oy += w * cosf(a) * r;
    """)
@ -46,7 +46,7 @@ var(33, 'juliascope', """
    float t_rnd = truncf(mwc_next_01(rctx) * fabsf(power));
    // TODO: don't draw the extra random number
    if (mwc_next(rctx) & 1) ang = -ang;
-    float tmpr = (2 * M_PI * t_rnd + ang) / power;
+    float tmpr = (2.0f * M_PI * t_rnd + ang) / power;

    float cn = {{px.get('xf.juliascope_dist / xf.juliascope_power / 2',
                         'juscope_cn')}};
--- a/cuburn/render.py
+++ b/cuburn/render.py
@ -26,103 +26,6 @@ class Genome(pyflam3.Genome):
        dens /= np.sum(dens)
        self.norm_density = [np.sum(dens[:i+1]) for i in range(len(dens))]

-class XForm(object):
-    """
-    A Python structure (*not* a ctypes wrapper) storing an xform. There are
-    a few differences between the meaning of properties on this object and
-    those of the C version; they are noted below.
-    """
-    def __init__(self, **kwargs):
-        read_affine = lambda c: [[c[0], c[1]], [c[2], c[3]], [c[4], c[5]]]
-        self.coefs = read_affine(map(float, kwargs.pop('coefs').split()))
-        if 'post' in kwargs:
-            self.post = read_affine(map(float, kwargs.pop('post').split()))
-        # TODO: more verification, detection of unknown variables, etc
-        for k, v in kwargs.items():
-            setattr(self, k, float(v))
-
-    # ctypes was being a pain. just parse the string.
-    @classmethod
-    def parse(cls, cp):
-        flame_str = flam3_print_to_string(byref(cp))
-        xforms = []
-        for line in flame_str.split('\n'):
-            if not line.strip().startswith('<xform'):
-                continue
-            props = dict(re.findall(r'(\w*)="([^"]*)"', line))
-            xforms.append(cls(**props))
-        # Set cumulative xform weight
-        xforms[0].cweight = xforms[0].weight
-        for i in range(1, len(xforms)):
-            xforms[i].cweight = xforms[i].weight + xforms[i-1].cweight
-        xforms[-1].cweight = 1.0
-        return xforms
-
-class _Frame(pyflam3.Frame):
-    """
-    ctypes flam3_frame object used for genome interpolation and
-    spatial filter creation
-    """
-    def __init__(self, genomes, *args, **kwargs):
-        pyflam3.Frame.__init__(self, *args, **kwargs)
-        self.genomes = (BaseGenome * len(genomes))()
-        for i in range(len(genomes)):
-            memmove(byref(self.genomes[i]), byref(genomes[i]),
-                    sizeof(BaseGenome))
-        self.ngenomes = len(genomes)
-
-        # TODO: allow user to override this
-        self.pixel_aspect_ratio = 1.0
-
-    def interpolate(self, time, stagger=0, cp=None):
-        cp = cp or BaseGenome()
-        flam3_interpolate(self.genomes, self.ngenomes, time,
-                          stagger, byref(cp))
-        return cp
-
-class Frame(object):
-    """
-    Handler for a single frame of a rendered genome.
-    """
-    def __init__(self, _frame, time):
-        self._frame = _frame
-        self.center_cp = self._frame.interpolate(time)
-
-    def upload_data(self, ctx, filters, time):
-        """
-        Prepare and upload the data needed to render this frame to the device.
-        """
-        center = self.center_cp
-        ncps = center.nbatches * center.ntemporal_samples
-
-        # TODO: isn't this leaking xforms from C all over the place?
-        stream = StringIO()
-        cp_list = []
-
-        for batch_idx in range(center.nbatches):
-            for time_idx in range(center.ntemporal_samples):
-                idx = time_idx + batch_idx * center.nbatches
-                interp_time = time + filters.temporal_deltas[idx]
-                cp = self._frame.interpolate(interp_time)
-                cp_list.append(cp)
-
-                cp.camera = Camera(self._frame, cp, filters)
-                cp.nsamples = (cp.camera.sample_density *
-                               center.width * center.height) / ncps
-
-
-        print "Expected writes:", (
-                cp.camera.sample_density * center.width * center.height)
-        min_time = min(filters.temporal_deltas)
-        max_time = max(filters.temporal_deltas)
-        for i, cp in enumerate(cp_list):
-            cp.norm_time = (filters.temporal_deltas[i] - min_time) / (
-                            max_time - min_time)
-            CPDataStream.pack_into(ctx, stream, frame=self, cp=cp, cp_idx=idx)
-        PaletteLookup.upload_palette(ctx, self, cp_list)
-        stream.seek(0)
-        IterThread.upload_cp_stream(ctx, stream.read(), ncps)
-
 class Animation(object):
    """
    Control structure for rendering a series of frames.
@ -142,57 +45,13 @@ class Animation(object):
    interpolated sequence between one or two genomes.
    """
    def __init__(self, genomes, ngenomes = None):
-        # _frame is the ctypes frame object used only for interpolation
-        self._frame = _Frame(genomes)
-
-        # Use the same set of filters throughout the anim, a la flam3
-        self.filters = Filters(self._frame, genomes[0])
-        self.features = Features(genomes, self.filters)
+        self.features = Features(genomes)

    def compile(self):
        pass
    def render_frame(self, time=0):
        pass

-class Filters(object):
-    def __init__(self, frame, cp):
-        # Use one oversample per filter set, even over multiple timesteps
-        self.oversample = frame.genomes[0].spatial_oversample
-
-        # Ugh. I'd really like to replace this mess
-        spa_filt_ptr = POINTER(c_double)()
-        spa_width = flam3_create_spatial_filter(byref(frame),
-                                                flam3_field_both,
-                                                byref(spa_filt_ptr))
-        if spa_width < 0:
-            raise EnvironmentError("flam3 call failed")
-        self.spatial = np.asarray([[spa_filt_ptr[y*spa_width+x] for x in
-            range(spa_width)] for y in range(spa_width)], dtype=np.double)
-        self.spatial_width = spa_width
-        flam3_free(spa_filt_ptr)
-
-        tmp_filt_ptr = POINTER(c_double)()
-        tmp_deltas_ptr = POINTER(c_double)()
-        steps = cp.nbatches * cp.ntemporal_samples
-        self.temporal_sum = flam3_create_temporal_filter(
-                steps,
-                cp.temporal_filter_type,
-                cp.temporal_filter_exp,
-                cp.temporal_filter_width,
-                byref(tmp_filt_ptr),
-                byref(tmp_deltas_ptr))
-        self.temporal = np.asarray([tmp_filt_ptr[i] for i in range(steps)],
-                                   dtype=np.double)
-        flam3_free(tmp_filt_ptr)
-        self.temporal_deltas = np.asarray(
-                [tmp_deltas_ptr[i] for i in range(steps)], dtype=np.double)
-        flam3_free(tmp_deltas_ptr)
-
-        # TODO: density estimation
-        self.gutter = (spa_width - self.oversample) / 2
-
-
-
 class Features(object):
    """
    Determine features and constants required to render a particular set of
@ -212,7 +71,7 @@ class Features(object):
    # performance too much. Power-of-two, please.
    palette_height = 16

-    def __init__(self, genomes, flt):
+    def __init__(self, genomes):
        any = lambda l: bool(filter(None, map(l, genomes)))
        self.max_ntemporal_samples = max(
                [cp.nbatches * cp.ntemporal_samples for cp in genomes])
@ -227,15 +86,6 @@ class Features(object):
        if any(lambda cp: cp.final_xform_enable):
            raise NotImplementedError("Final xform")

-        # Histogram (and log-density copy) width and height
-        self.hist_width  = flt.oversample * genomes[0].width  + 2 * flt.gutter
-        self.hist_height = flt.oversample * genomes[0].height + 2 * flt.gutter
-        # Histogram stride, for better filtering. This code assumes the
-        # 128-byte L1 cache line width of Fermi devices, and a 16-byte
-        # histogram bucket size. TODO: detect these things programmatically,
-        # particularly the histogram bucket size, which may be split soon
-        self.hist_stride = 8 * int(math.ceil(self.hist_width / 8.0))
-
 class XFormFeatures(object):
    def __init__(self, xforms, xform_id):
        self.id = xform_id
@ -248,7 +98,7 @@ class XFormFeatures(object):

 class Camera(object):
    """Viewport and exposure."""
-    def __init__(self, frame, cp, filters):
+    def __init__(self, frame, cp):
        # Calculate the conversion matrix between the IFS space (xform
        # coordinates) and the sampling lattice (bucket addresses)
        # TODO: test this code (against compute_camera?)
@ -262,8 +112,6 @@ class Camera(object):
        self.ppu = Point(
            cp.pixels_per_unit * scale / frame.pixel_aspect_ratio,
            cp.pixels_per_unit * scale)
-        # extra shifts applied due to gutter
-        gutter = filters.gutter / (cp.spatial_oversample * self.ppu)
        cornerLL = center - (size / (2 * self.ppu))
        self.lower_bounds = cornerLL - gutter
        self.upper_bounds = cornerLL + (size / self.ppu) + gutter
@ -271,3 +119,4 @@ class Camera(object):
        self.norm_offset = -self.norm_scale * self.lower_bounds
        self.idx_scale = size * self.norm_scale
        self.idx_offset = size * self.norm_offset
+
--- a/main.py
+++ b/main.py
@ -11,7 +11,7 @@

 import os
 import sys
-os.environ['PATH'] = '/usr/x86_64-pc-linux-gnu/gcc-bin/4.4.5:' + os.environ['PATH']
+
 from pprint import pprint
 from ctypes import *

@ -19,28 +19,38 @@ import numpy as np
 np.set_printoptions(precision=5, edgeitems=20)
 import scipy

+import pyglet
+import pycuda.autoinit
+
 from fr0stlib.pyflam3 import *
 from fr0stlib.pyflam3._flam3 import *

-import pyglet
-window = pyglet.window.Window(1024, 1024)
-import pycuda.gl.autoinit
-
+import cuburn._pyflam3_hacks
 from cuburn.render import *
 from cuburn.code.mwc import MWCTest
-from cuburn.code.iter import silly, membench
+from cuburn.code.iter import render, membench

+# Required on my system; CUDA doesn't yet work with GCC 4.5
+os.environ['PATH'] = ('/usr/x86_64-pc-linux-gnu/gcc-bin/4.4.5:'
+                     + os.environ['PATH'])

 def main(args):
-    #MWCTest.test_mwc()
-    with open(args[-1]) as fp:
+    if '-t' in args:
+        MWCTest.test_mwc()
+        membench()
+
+    window = pyglet.window.Window(1024, 1024) if '-g' in args else None
+
+    with open(args[1]) as fp:
        genomes = Genome.from_string(fp.read())
    anim = Animation(genomes)
-    accum, den = silly(anim.features, genomes)
+    accum, den = render(anim.features, genomes)

    noalpha = np.delete(accum, 3, axis=2)
    scipy.misc.imsave('rendered.png', noalpha)

+
+
    if '-g' not in args:
        return

@ -66,7 +76,7 @@ def main(args):
    pyglet.app.run()

 if __name__ == "__main__":
-    if len(sys.argv) < 2 or not os.path.isfile(sys.argv[-1]):
+    if len(sys.argv) < 2 or not os.path.isfile(sys.argv[1]):
        print "Last argument must be a path to a genome file"
        sys.exit(1)
    main(sys.argv)