2014-07-08 03:11:14 -04:00
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include "EmberCLPch.h"
|
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// Various data structures defined for the CPU and OpenCL.
|
|
|
|
/// These are stripped down versions of the classes in Ember, for use with OpenCL.
|
|
|
|
/// Their sole purpose is to pass values from the host to the device.
|
|
|
|
/// They retain most of the member variables, but do not contain the functions.
|
|
|
|
/// Visual Studio defaults to alignment of 16, but it's made explicit in case another compiler is used.
|
|
|
|
/// This must match the alignment specified in the kernel.
|
|
|
|
/// </summary>
|
|
|
|
|
|
|
|
namespace EmberCLns
|
|
|
|
{
|
|
|
|
/// <summary>
|
|
|
|
/// Various constants needed for rendering.
|
|
|
|
/// </summary>
|
|
|
|
static string ConstantDefinesString(bool doublePrecision)
|
|
|
|
{
|
|
|
|
ostringstream os;
|
2018-03-28 00:32:10 -04:00
|
|
|
os << "#if defined(cl_amd_fp64)\n"//AMD extension available?
|
|
|
|
" #pragma OPENCL EXTENSION cl_amd_fp64 : enable\n"
|
|
|
|
"#endif\n"
|
|
|
|
"#if defined(cl_khr_fp64)\n"//Khronos extension available?
|
|
|
|
" #pragma OPENCL EXTENSION cl_khr_fp64 : enable\n"
|
|
|
|
"#endif\n"
|
|
|
|
"#pragma OPENCL EXTENSION cl_khr_int64_base_atomics : enable\n";//Only supported on nVidia.
|
2014-07-08 03:11:14 -04:00
|
|
|
|
|
|
|
if (doublePrecision)
|
|
|
|
{
|
2018-03-28 00:32:10 -04:00
|
|
|
os <<
|
2015-12-31 16:41:59 -05:00
|
|
|
"typedef long intPrec;\n"
|
|
|
|
"typedef uint atomi;\n"//Same size as real_bucket_t, always 4 bytes.
|
|
|
|
"typedef double real_t;\n"
|
|
|
|
"typedef float real_bucket_t;\n"//Assume buckets are always float, even though iter calcs are in double.
|
|
|
|
"typedef double2 real2;\n"
|
|
|
|
"typedef double3 real3;\n"
|
|
|
|
"typedef double4 real4;\n"
|
|
|
|
"typedef float4 real4_bucket;\n"//And here too.
|
|
|
|
"#define EPS (DBL_EPSILON)\n"
|
|
|
|
"#define TLOW (DBL_MIN)\n"
|
|
|
|
"#define TMAX (DBL_MAX)\n"
|
|
|
|
;
|
2014-07-08 03:11:14 -04:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
os << "typedef int intPrec;\n"
|
2015-12-31 16:41:59 -05:00
|
|
|
"typedef uint atomi;\n"
|
|
|
|
"typedef float real_t;\n"
|
|
|
|
"typedef float real_bucket_t;\n"
|
|
|
|
"typedef float2 real2;\n"
|
|
|
|
"typedef float3 real3;\n"
|
|
|
|
"typedef float4 real4;\n"
|
|
|
|
"typedef float4 real4_bucket;\n"
|
|
|
|
"#define EPS (FLT_EPSILON)\n"
|
|
|
|
"#define TLOW (FLT_MIN)\n"
|
|
|
|
"#define TMAX (FLT_MAX)\n"
|
|
|
|
;
|
2014-07-08 03:11:14 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
os <<
|
2015-12-31 16:41:59 -05:00
|
|
|
"typedef long int int64;\n"
|
|
|
|
"typedef unsigned long int uint64;\n"
|
|
|
|
"\n"
|
|
|
|
"#define EPS6 ((1e-6))\n"
|
|
|
|
"\n"
|
|
|
|
"//The number of threads per block used in the iteration function. Don't change\n"
|
|
|
|
"//it lightly; the block size is hard coded to be exactly 32 x 8.\n"
|
|
|
|
"#define NTHREADS 256u\n"
|
|
|
|
"#define THREADS_PER_WARP 32u\n"
|
|
|
|
"#define NWARPS (NTHREADS / THREADS_PER_WARP)\n"
|
|
|
|
"#define DE_THRESH 100u\n"
|
2018-09-22 01:42:18 -04:00
|
|
|
"#define BadVal(x) (isnan(x))\n"
|
2015-12-31 16:41:59 -05:00
|
|
|
"#define SQR(x) ((x) * (x))\n"
|
|
|
|
"#define CUBE(x) ((x) * (x) * (x))\n"
|
2017-07-05 02:08:06 -04:00
|
|
|
"#define MPI ((real_t)M_PI)\n"
|
|
|
|
"#define MPI2 ((real_t)M_PI_2)\n"
|
|
|
|
"#define MPI4 ((real_t)M_PI_4)\n"
|
|
|
|
"#define M1PI ((real_t)M_1_PI)\n"
|
|
|
|
"#define M2PI ((real_t)M_2_PI)\n"
|
|
|
|
"#define M_2PI (MPI * 2)\n"
|
|
|
|
"#define M_3PI (MPI * 3)\n"
|
2015-12-31 16:41:59 -05:00
|
|
|
"#define SQRT5 2.2360679774997896964091736687313\n"
|
|
|
|
"#define M_PHI 1.61803398874989484820458683436563\n"
|
--User changes
-Add new variations waves22, waves23, waves42, waves3 and waves4 from user tatasz.
-Add new stylesheet called lightdark.qss which gives a more modern look to the dark theme. Started by Michel Mastriani (triptychaos).
--Included in the qmake and Wix installers.
--Code changes
-Add a new C# project that attempts to convert Apophysis plugins to Fractorium style Variation classes. It's not entirely perfect, but gets most of the job done much more quickly than doing so manually.
-Remove unused OpenCL functions from variations: elliptic, poincare, mask, bMod, bSwirl, bTransform, bCollide, farblur, popcorn2_3D, falloff, falloff2, falloff3, crackle2, waves2b, hypercrop, depth_gaussian2, depth_sine, depth_sine2, dust, asteria, vibration, vibration2, arctanh, smartshape, squares, starblur2, Truchet,.
-Add code in EmberTester to automatically detect such unused functions.
2019-05-06 22:29:27 -04:00
|
|
|
"#define M_1_2PI 0.15915494309189533576888376337251\n"
|
2017-07-05 02:08:06 -04:00
|
|
|
"#define DEG_2_RAD (MPI / 180)\n"
|
2017-08-07 22:53:13 -04:00
|
|
|
"#define CURVES_LENGTH_M1 ((real_bucket_t)" << CURVES_LENGTH_M1 << ")\n" <<
|
|
|
|
"#define ONE_OVER_CURVES_LENGTH_M1 ((real_bucket_t)" << ONE_OVER_CURVES_LENGTH_M1 << ")\n" <<
|
2015-12-31 16:41:59 -05:00
|
|
|
"\n"
|
|
|
|
"//Index in each dimension of a thread within a block.\n"
|
|
|
|
"#define THREAD_ID_X (get_local_id(0))\n"
|
|
|
|
"#define THREAD_ID_Y (get_local_id(1))\n"
|
|
|
|
"#define THREAD_ID_Z (get_local_id(2))\n"
|
|
|
|
"\n"
|
|
|
|
"//Index in each dimension of a block within a grid.\n"
|
|
|
|
"#define BLOCK_ID_X (get_group_id(0))\n"
|
|
|
|
"#define BLOCK_ID_Y (get_group_id(1))\n"
|
|
|
|
"#define BLOCK_ID_Z (get_group_id(2))\n"
|
|
|
|
"\n"
|
|
|
|
"//Absolute index in each dimension of a thread within a grid.\n"
|
|
|
|
"#define GLOBAL_ID_X (get_global_id(0))\n"
|
|
|
|
"#define GLOBAL_ID_Y (get_global_id(1))\n"
|
|
|
|
"#define GLOBAL_ID_Z (get_global_id(2))\n"
|
|
|
|
"\n"
|
|
|
|
"//Dimensions of a block.\n"
|
|
|
|
"#define BLOCK_SIZE_X (get_local_size(0))\n"
|
|
|
|
"#define BLOCK_SIZE_Y (get_local_size(1))\n"
|
|
|
|
"#define BLOCK_SIZE_Z (get_local_size(2))\n"
|
|
|
|
"\n"
|
|
|
|
"//Dimensions of a grid, in terms of blocks.\n"
|
|
|
|
"#define GRID_SIZE_X (get_num_groups(0))\n"
|
|
|
|
"#define GRID_SIZE_Y (get_num_groups(1))\n"
|
|
|
|
"#define GRID_SIZE_Z (get_num_groups(2))\n"
|
|
|
|
"\n"
|
|
|
|
"//Dimensions of a grid, in terms of threads.\n"
|
|
|
|
"#define GLOBAL_SIZE_X (get_global_size(0))\n"
|
|
|
|
"#define GLOBAL_SIZE_Y (get_global_size(1))\n"
|
|
|
|
"#define GLOBAL_SIZE_Z (get_global_size(2))\n"
|
|
|
|
"\n"
|
|
|
|
"#define INDEX_IN_BLOCK_2D (THREAD_ID_Y * BLOCK_SIZE_X + THREAD_ID_X)\n"
|
|
|
|
"#define INDEX_IN_BLOCK_3D ((BLOCK_SIZE_X * BLOCK_SIZE_Y * THREAD_ID_Z) + INDEX_IN_BLOCK_2D)\n"
|
|
|
|
"\n"
|
|
|
|
"#define INDEX_IN_GRID_2D (GLOBAL_ID_Y * GLOBAL_SIZE_X + GLOBAL_ID_X)\n"
|
|
|
|
"#define INDEX_IN_GRID_3D ((GLOBAL_SIZE_X * GLOBAL_SIZE_Y * GLOBAL_ID_Z) + INDEX_IN_GRID_2D)\n"
|
|
|
|
"\n";
|
2014-07-08 03:11:14 -04:00
|
|
|
return os.str();
|
|
|
|
}
|
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// A point structure on the host that maps to the one used on the device to iterate in OpenCL.
|
|
|
|
/// It might seem better to use vec4, however 2D palettes and even 3D coordinates may eventually
|
|
|
|
/// be supported, which will make it more than 4 members.
|
|
|
|
/// </summary>
|
|
|
|
template <typename T>
|
|
|
|
struct ALIGN PointCL
|
|
|
|
{
|
|
|
|
T m_X;
|
|
|
|
T m_Y;
|
|
|
|
T m_Z;
|
|
|
|
T m_ColorX;
|
2014-12-06 00:05:09 -05:00
|
|
|
uint m_LastXfUsed;
|
2014-07-08 03:11:14 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// The point structure used to iterate in OpenCL.
|
|
|
|
/// It might seem better to use float4, however 2D palettes and even 3D coordinates may eventually
|
|
|
|
/// be supported, which will make it more than 4 members.
|
|
|
|
/// </summary>
|
|
|
|
static const char* PointCLStructString =
|
2015-12-31 16:41:59 -05:00
|
|
|
"typedef struct __attribute__ " ALIGN_CL " _Point\n"
|
|
|
|
"{\n"
|
|
|
|
" real_t m_X;\n"
|
|
|
|
" real_t m_Y;\n"
|
|
|
|
" real_t m_Z;\n"
|
|
|
|
" real_t m_ColorX;\n"
|
|
|
|
" uint m_LastXfUsed;\n"
|
|
|
|
"} Point;\n"
|
|
|
|
"\n";
|
2014-07-08 03:11:14 -04:00
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// A structure on the host used to hold all of the needed information for an xform used on the device to iterate in OpenCL.
|
|
|
|
/// Template argument expected to be float or double.
|
|
|
|
/// </summary>
|
|
|
|
template <typename T>
|
|
|
|
struct ALIGN XformCL
|
|
|
|
{
|
|
|
|
T m_A, m_B, m_C, m_D, m_E, m_F;//24 (48)
|
--User changes
-Support 4k monitors, and in general, properly scale any monitor that is not HD.
-Allow for a spatial filter of radius zero, which means do not use a spatial filter.
-Add new variations: concentric, cpow3, helicoid, helix, rand_cubes, sphereblur.
-Use a new method for computing elliptic which is more precise. Developed by Discord user Claude.
-Remove the 8 variation per xform limitation on the GPU.
-Allow for loading the last flame file on startup, rather than randoms.
-Use two different default quality values in the interactive renderer, one each for CPU and GPU.
-Creating linked xforms was using non-standard behavior. Make it match Apo and also support creating multiple linked xforms at once.
--Bug fixes
-No variations in an xform used to have the same behavior as a single linear variation with weight 1. While sensible, this breaks backward compatibility. No variations now sets the output point to zeroes.
-Prevent crashing the program when adjusting a value on the main window while a final render is in progress.
-The xaos table was inverted.
--Code changes
-Convert projects to Visual Studio 2017.
-Change bad vals from +- 1e10 to +-1e20.
-Reintroduce the symmetry tag in xforms for legacy support in programs that do not use color_speed.
-Compiler will not let us use default values in templated member functions anymore.
2017-11-26 20:27:00 -05:00
|
|
|
T m_PostA, m_PostB, m_PostC, m_PostD, m_PostE, m_PostF;//48 (96)
|
|
|
|
T m_DirectColor;//52 (104)
|
|
|
|
T m_ColorSpeedCache;//56 (112)
|
|
|
|
T m_OneMinusColorCache;//60 (120)
|
|
|
|
T m_Opacity;//64 (128)
|
2014-07-08 03:11:14 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// The xform structure used to iterate in OpenCL.
|
|
|
|
/// </summary>
|
|
|
|
static const char* XformCLStructString =
|
2015-12-31 16:41:59 -05:00
|
|
|
"typedef struct __attribute__ " ALIGN_CL " _XformCL\n"
|
|
|
|
"{\n"
|
|
|
|
" real_t m_A, m_B, m_C, m_D, m_E, m_F;\n"
|
|
|
|
" real_t m_PostA, m_PostB, m_PostC, m_PostD, m_PostE, m_PostF;\n"
|
|
|
|
" real_t m_DirectColor;\n"
|
|
|
|
" real_t m_ColorSpeedCache;\n"
|
|
|
|
" real_t m_OneMinusColorCache;\n"
|
|
|
|
" real_t m_Opacity;\n"
|
|
|
|
"} XformCL;\n"
|
|
|
|
"\n";
|
2014-07-08 03:11:14 -04:00
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// A structure on the host used to hold all of the needed information for an ember used on the device to iterate in OpenCL.
|
|
|
|
/// Template argument expected to be float or double.
|
|
|
|
/// </summary>
|
|
|
|
template <typename T>
|
|
|
|
struct ALIGN EmberCL
|
|
|
|
{
|
--User changes:
-Show common folder locations such as documents, downloads, pictures in the sidebar in all file dialogs.
-Warning message about exceeding memory in final render dialog now suggests strips as the solution to the problem.
-Strips now has a tooltip explaining what it does.
-Allow more digits in the spinners on the color section the flame tab.
-Add manually adjustable size spinners in the final render dialog. Percentage scale and absolute size are fully synced.
-Default prefix in final render is now the filename when doing animations (coming from sequence section of the library tab).
-Changed the elliptic variation back to using a less precise version for float, and a more precise version for double. The last release had it always using double.
-New applied xaos table that shows a read-only view of actual weights by taking the base xform weights and multiplying them by the xaos values.
-New table in the xaos tab that gives a graphical representation of the probability that each xform is chosen, with and without xaos.
-Add button to transpose the xaos rows and columns.
-Add support for importing .chaos files from Chaotica.
--Pasting back to Chaotica will work for most, but not all, variations due to incompatible parameter names in some.
-Curves are now splines instead of Bezier. This adds compatibility with Chaotica, but breaks it for Apophysis. Xmls are still pastable, but the color curves will look different.
--The curve editor on the palette tab can now add points by clicking on the lines and remove points by clicking on the points themselves, just like Chaotica.
--Splines are saved in four new xml fields: overall_curve, red_curve, green_curve and blue_curve.
-Allow for specifying the percentage of a sub batch each thread should iterate through per kernel call when running with OpenCL. This gives a roughly 1% performance increase due to having to make less kernel calls while iterating.
--This field is present for interactive editing (where it's not very useful) and in the final render dialog.
--On the command line, this is specified as --sbpctth for EmberRender and EmberAnimate.
-Allow double clicking to toggle the supersample field in the flame tab between 1 and 2 for easily checking the effect of the field.
-When showing affine values as polar coordinates, show angles normalized to 360 to match Chaotica.
-Fuse Count spinner now toggles between 15 and 100 when double clicking for easily checking the effect of the field.
-Added field for limiting the range in the x and y direction that the initial points are chosen from.
-Added a field called K2 which is an alternative way to set brightness, ignored when zero.
--This has no effect for many variations, but hs a noticeable effect for some.
-Added new variations:
arcsech
arcsech2
arcsinh
arctanh
asteria
block
bwraps_rand
circlecrop2
coth_spiral
crackle2
depth_blur
depth_blur2
depth_gaussian
depth_gaussian2
depth_ngon
depth_ngon2
depth_sine
depth_sine2
dragonfire
dspherical
dust
excinis
exp2
flipx
flowerdb
foci_p
gaussian
glynnia2
glynnsim4
glynnsim5
henon
henon
hex_rand
hex_truchet
hypershift
lazyjess
lens
lozi
lozi
modulusx
modulusy
oscilloscope2
point_symmetry
pointsymmetry
projective
pulse
rotate
scry2
shift
smartshape
spher
squares
starblur2
swirl3
swirl3r
tanh_spiral
target0
target2
tile_hlp
truchet_glyph
truchet_inv
truchet_knot
unicorngaloshen
vibration
vibration2
--hex_truchet, hex_rand should always use double. They are extremely sensitive.
--Bug fixes:
-Bounds sign was flipped for x coordinate of world space when center was not zero.
-Right clicking and dragging spinner showed menu on mouse up, even if it was very far away.
-Text boxes for size in final render dialog were hard to type in. Same bug as xform weight used to be so fix the same way.
-Fix spelling to be plural in toggle color speed box.
-Stop using the blank user palette to generate flames. Either put colored palettes in it, or exclude it from randoms.
-Clicking the random palette button for a palette file with only one palette in it would freeze the program.
-Clicking none scale in final render did not re-render the preview.
-Use less precision on random xaos. No need for 12 decimal places.
-The term sub batch is overloaded in the options dialog. Change the naming and tooltip of those settings for cpu and opencl.
--Also made clear in the tooltip for the default opencl quality setting that the value is per device.
-The arrows spinner in palette editor appears like a read-only label. Made it look like a spinner.
-Fix border colors for various spin boxes and table headers in the style sheet. Requires reload.
-Fix a bug in the bwraps variation which would produce different results than Chaotica and Apophysis.
-Synth was allowed to be selected for random flame generation when using an Nvidia card but it shouldn't have been because Nvidia has a hard time compiling synth.
-A casting bug in the OpenCL kernels for log scaling and density filtering was preventing successful compilations on Intel iGPUs. Fixed even though we don't support anything other than AMD and Nvidia.
-Palette rotation (click and drag) position was not being reset when loading a new flame.
-When the xform circles were hidden, opening and closing the options dialog would improperly reshow them.
-Double click toggle was broken on integer spin boxes.
-Fixed tab order of some controls.
-Creating a palette from a jpg in the palette editor only produced a single color.
--Needed to package imageformats/qjpeg.dll with the Windows installer.
-The basic memory benchmark test flame was not really testing memory. Make it more spread out.
-Remove the temporal samples field from the flame tab, it was never used because it's only an animation parameter which is specified in the final render dialog or on the command line with EmberAnimate.
--Code changes:
-Add IsEmpty() to Palette to determine if a palette is all black.
-Attempt to avoid selecting a blank palette in PaletteList::GetRandomPalette().
-Add function ScanForChaosNodes() and some associated helper functions in XmlToEmber.
-Make variation param name correction be case insensitive in XmlToEmber.
-Report error when assigning a variation param value in XmlToEmber.
-Add SubBatchPercentPerThread() method to RendererCL.
-Override enterEvent() and leaveEvent() in DoubleSpinBox and SpinBox to prevent the context menu from showing up on right mouse up after already leaving the spinner.
-Filtering the mouse wheel event in TableWidget no longer appears to be needed. It was probably an old Qt bug that has been fixed.
-Gui/ember syncing code in the final render dialog needed to be reworked to accommodate absolute sizes.
2019-04-13 22:00:46 -04:00
|
|
|
T m_RandPointRange;
|
2014-07-08 03:11:14 -04:00
|
|
|
T m_CamZPos;
|
|
|
|
T m_CamPerspective;
|
|
|
|
T m_CamYaw;
|
|
|
|
T m_CamPitch;
|
|
|
|
T m_CamDepthBlur;
|
|
|
|
T m_BlurCoef;
|
|
|
|
m3T m_CamMat;
|
|
|
|
T m_CenterX, m_CenterY;
|
|
|
|
T m_RotA, m_RotB, m_RotD, m_RotE;
|
2019-04-23 22:50:42 -04:00
|
|
|
T m_Psm1;
|
|
|
|
T m_Psm2;
|
2014-07-08 03:11:14 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// The ember structure used to iterate in OpenCL.
|
|
|
|
/// </summary>
|
|
|
|
static const char* EmberCLStructString =
|
2015-12-31 16:41:59 -05:00
|
|
|
"typedef struct __attribute__ " ALIGN_CL " _EmberCL\n"
|
|
|
|
"{\n"
|
--User changes:
-Show common folder locations such as documents, downloads, pictures in the sidebar in all file dialogs.
-Warning message about exceeding memory in final render dialog now suggests strips as the solution to the problem.
-Strips now has a tooltip explaining what it does.
-Allow more digits in the spinners on the color section the flame tab.
-Add manually adjustable size spinners in the final render dialog. Percentage scale and absolute size are fully synced.
-Default prefix in final render is now the filename when doing animations (coming from sequence section of the library tab).
-Changed the elliptic variation back to using a less precise version for float, and a more precise version for double. The last release had it always using double.
-New applied xaos table that shows a read-only view of actual weights by taking the base xform weights and multiplying them by the xaos values.
-New table in the xaos tab that gives a graphical representation of the probability that each xform is chosen, with and without xaos.
-Add button to transpose the xaos rows and columns.
-Add support for importing .chaos files from Chaotica.
--Pasting back to Chaotica will work for most, but not all, variations due to incompatible parameter names in some.
-Curves are now splines instead of Bezier. This adds compatibility with Chaotica, but breaks it for Apophysis. Xmls are still pastable, but the color curves will look different.
--The curve editor on the palette tab can now add points by clicking on the lines and remove points by clicking on the points themselves, just like Chaotica.
--Splines are saved in four new xml fields: overall_curve, red_curve, green_curve and blue_curve.
-Allow for specifying the percentage of a sub batch each thread should iterate through per kernel call when running with OpenCL. This gives a roughly 1% performance increase due to having to make less kernel calls while iterating.
--This field is present for interactive editing (where it's not very useful) and in the final render dialog.
--On the command line, this is specified as --sbpctth for EmberRender and EmberAnimate.
-Allow double clicking to toggle the supersample field in the flame tab between 1 and 2 for easily checking the effect of the field.
-When showing affine values as polar coordinates, show angles normalized to 360 to match Chaotica.
-Fuse Count spinner now toggles between 15 and 100 when double clicking for easily checking the effect of the field.
-Added field for limiting the range in the x and y direction that the initial points are chosen from.
-Added a field called K2 which is an alternative way to set brightness, ignored when zero.
--This has no effect for many variations, but hs a noticeable effect for some.
-Added new variations:
arcsech
arcsech2
arcsinh
arctanh
asteria
block
bwraps_rand
circlecrop2
coth_spiral
crackle2
depth_blur
depth_blur2
depth_gaussian
depth_gaussian2
depth_ngon
depth_ngon2
depth_sine
depth_sine2
dragonfire
dspherical
dust
excinis
exp2
flipx
flowerdb
foci_p
gaussian
glynnia2
glynnsim4
glynnsim5
henon
henon
hex_rand
hex_truchet
hypershift
lazyjess
lens
lozi
lozi
modulusx
modulusy
oscilloscope2
point_symmetry
pointsymmetry
projective
pulse
rotate
scry2
shift
smartshape
spher
squares
starblur2
swirl3
swirl3r
tanh_spiral
target0
target2
tile_hlp
truchet_glyph
truchet_inv
truchet_knot
unicorngaloshen
vibration
vibration2
--hex_truchet, hex_rand should always use double. They are extremely sensitive.
--Bug fixes:
-Bounds sign was flipped for x coordinate of world space when center was not zero.
-Right clicking and dragging spinner showed menu on mouse up, even if it was very far away.
-Text boxes for size in final render dialog were hard to type in. Same bug as xform weight used to be so fix the same way.
-Fix spelling to be plural in toggle color speed box.
-Stop using the blank user palette to generate flames. Either put colored palettes in it, or exclude it from randoms.
-Clicking the random palette button for a palette file with only one palette in it would freeze the program.
-Clicking none scale in final render did not re-render the preview.
-Use less precision on random xaos. No need for 12 decimal places.
-The term sub batch is overloaded in the options dialog. Change the naming and tooltip of those settings for cpu and opencl.
--Also made clear in the tooltip for the default opencl quality setting that the value is per device.
-The arrows spinner in palette editor appears like a read-only label. Made it look like a spinner.
-Fix border colors for various spin boxes and table headers in the style sheet. Requires reload.
-Fix a bug in the bwraps variation which would produce different results than Chaotica and Apophysis.
-Synth was allowed to be selected for random flame generation when using an Nvidia card but it shouldn't have been because Nvidia has a hard time compiling synth.
-A casting bug in the OpenCL kernels for log scaling and density filtering was preventing successful compilations on Intel iGPUs. Fixed even though we don't support anything other than AMD and Nvidia.
-Palette rotation (click and drag) position was not being reset when loading a new flame.
-When the xform circles were hidden, opening and closing the options dialog would improperly reshow them.
-Double click toggle was broken on integer spin boxes.
-Fixed tab order of some controls.
-Creating a palette from a jpg in the palette editor only produced a single color.
--Needed to package imageformats/qjpeg.dll with the Windows installer.
-The basic memory benchmark test flame was not really testing memory. Make it more spread out.
-Remove the temporal samples field from the flame tab, it was never used because it's only an animation parameter which is specified in the final render dialog or on the command line with EmberAnimate.
--Code changes:
-Add IsEmpty() to Palette to determine if a palette is all black.
-Attempt to avoid selecting a blank palette in PaletteList::GetRandomPalette().
-Add function ScanForChaosNodes() and some associated helper functions in XmlToEmber.
-Make variation param name correction be case insensitive in XmlToEmber.
-Report error when assigning a variation param value in XmlToEmber.
-Add SubBatchPercentPerThread() method to RendererCL.
-Override enterEvent() and leaveEvent() in DoubleSpinBox and SpinBox to prevent the context menu from showing up on right mouse up after already leaving the spinner.
-Filtering the mouse wheel event in TableWidget no longer appears to be needed. It was probably an old Qt bug that has been fixed.
-Gui/ember syncing code in the final render dialog needed to be reworked to accommodate absolute sizes.
2019-04-13 22:00:46 -04:00
|
|
|
" real_t m_RandPointRange;\n"
|
2015-12-31 16:41:59 -05:00
|
|
|
" real_t m_CamZPos;\n"
|
|
|
|
" real_t m_CamPerspective;\n"
|
|
|
|
" real_t m_CamYaw;\n"
|
|
|
|
" real_t m_CamPitch;\n"
|
|
|
|
" real_t m_CamDepthBlur;\n"
|
|
|
|
" real_t m_BlurCoef;\n"
|
|
|
|
" real_t m_C00;\n"
|
|
|
|
" real_t m_C01;\n"
|
|
|
|
" real_t m_C02;\n"
|
|
|
|
" real_t m_C10;\n"
|
|
|
|
" real_t m_C11;\n"
|
|
|
|
" real_t m_C12;\n"
|
|
|
|
" real_t m_C20;\n"
|
|
|
|
" real_t m_C21;\n"
|
|
|
|
" real_t m_C22;\n"
|
|
|
|
" real_t m_CenterX, m_CenterY;\n"
|
|
|
|
" real_t m_RotA, m_RotB, m_RotD, m_RotE;\n"
|
2019-04-23 22:50:42 -04:00
|
|
|
" real_t m_Psm1;\n"
|
|
|
|
" real_t m_Psm2;\n"
|
2015-12-31 16:41:59 -05:00
|
|
|
"} EmberCL;\n"
|
|
|
|
"\n";
|
2014-07-08 03:11:14 -04:00
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// A structure on the host used to hold all of the needed information for cartesian to raster mapping used on the device to iterate in OpenCL.
|
|
|
|
/// Template argument expected to be float or double.
|
|
|
|
/// </summary>
|
|
|
|
template <typename T>
|
|
|
|
struct ALIGN CarToRasCL
|
|
|
|
{
|
|
|
|
T m_PixPerImageUnitW, m_RasLlX;
|
2014-12-06 00:05:09 -05:00
|
|
|
uint m_RasWidth;
|
2014-07-08 03:11:14 -04:00
|
|
|
T m_PixPerImageUnitH, m_RasLlY;
|
|
|
|
T m_CarLlX, m_CarUrX, m_CarUrY, m_CarLlY;
|
|
|
|
};
|
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// The cartesian to raster structure used to iterate in OpenCL.
|
|
|
|
/// </summary>
|
|
|
|
static const char* CarToRasCLStructString =
|
2015-12-31 16:41:59 -05:00
|
|
|
"typedef struct __attribute__ " ALIGN_CL " _CarToRasCL\n"
|
|
|
|
"{\n"
|
|
|
|
" real_t m_PixPerImageUnitW, m_RasLlX;\n"
|
|
|
|
" uint m_RasWidth;\n"
|
|
|
|
" real_t m_PixPerImageUnitH, m_RasLlY;\n"
|
|
|
|
" real_t m_CarLlX, m_CarUrX, m_CarUrY, m_CarLlY;\n"
|
|
|
|
"} CarToRasCL;\n"
|
|
|
|
"\n";
|
2014-07-08 03:11:14 -04:00
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// A structure on the host used to hold all of the needed information for density filtering used on the device to iterate in OpenCL.
|
|
|
|
/// Note that the actual filter buffer is held elsewhere.
|
|
|
|
/// Template argument expected to be float or double.
|
|
|
|
/// </summary>
|
|
|
|
template <typename T>
|
|
|
|
struct ALIGN DensityFilterCL
|
|
|
|
{
|
|
|
|
T m_Curve;
|
|
|
|
T m_K1;
|
|
|
|
T m_K2;
|
2014-12-06 00:05:09 -05:00
|
|
|
uint m_Supersample;
|
|
|
|
uint m_SuperRasW;
|
|
|
|
uint m_SuperRasH;
|
|
|
|
uint m_KernelSize;
|
|
|
|
uint m_MaxFilterIndex;
|
|
|
|
uint m_MaxFilteredCounts;
|
|
|
|
uint m_FilterWidth;
|
2014-07-08 03:11:14 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// The density filtering structure used to iterate in OpenCL.
|
|
|
|
/// Note that the actual filter buffer is held elsewhere.
|
|
|
|
/// </summary>
|
|
|
|
static const char* DensityFilterCLStructString =
|
2015-12-31 16:41:59 -05:00
|
|
|
"typedef struct __attribute__ " ALIGN_CL " _DensityFilterCL\n"
|
|
|
|
"{\n"
|
|
|
|
" real_bucket_t m_Curve;\n"
|
|
|
|
" real_bucket_t m_K1;\n"
|
|
|
|
" real_bucket_t m_K2;\n"
|
|
|
|
" uint m_Supersample;\n"
|
|
|
|
" uint m_SuperRasW;\n"
|
|
|
|
" uint m_SuperRasH;\n"
|
|
|
|
" uint m_KernelSize;\n"
|
|
|
|
" uint m_MaxFilterIndex;\n"
|
|
|
|
" uint m_MaxFilteredCounts;\n"
|
|
|
|
" uint m_FilterWidth;\n"
|
|
|
|
"} DensityFilterCL;\n"
|
|
|
|
"\n";
|
2014-07-08 03:11:14 -04:00
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// A structure on the host used to hold all of the needed information for spatial filtering used on the device to iterate in OpenCL.
|
|
|
|
/// Note that the actual filter buffer is held elsewhere.
|
|
|
|
/// </summary>
|
|
|
|
template <typename T>
|
|
|
|
struct ALIGN SpatialFilterCL
|
|
|
|
{
|
2014-12-06 00:05:09 -05:00
|
|
|
uint m_SuperRasW;
|
|
|
|
uint m_SuperRasH;
|
|
|
|
uint m_FinalRasW;
|
|
|
|
uint m_FinalRasH;
|
|
|
|
uint m_Supersample;
|
|
|
|
uint m_FilterWidth;
|
|
|
|
uint m_DensityFilterOffset;
|
|
|
|
uint m_YAxisUp;
|
2014-07-08 03:11:14 -04:00
|
|
|
T m_Vibrancy;
|
|
|
|
T m_HighlightPower;
|
|
|
|
T m_Gamma;
|
|
|
|
T m_LinRange;
|
|
|
|
Color<T> m_Background;
|
|
|
|
};
|
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// The spatial filtering structure used to iterate in OpenCL.
|
|
|
|
/// Note that the actual filter buffer is held elsewhere.
|
|
|
|
/// </summary>
|
|
|
|
static const char* SpatialFilterCLStructString =
|
2015-12-31 16:41:59 -05:00
|
|
|
"typedef struct __attribute__ ((aligned (16))) _SpatialFilterCL\n"
|
|
|
|
"{\n"
|
|
|
|
" uint m_SuperRasW;\n"
|
|
|
|
" uint m_SuperRasH;\n"
|
|
|
|
" uint m_FinalRasW;\n"
|
|
|
|
" uint m_FinalRasH;\n"
|
|
|
|
" uint m_Supersample;\n"
|
|
|
|
" uint m_FilterWidth;\n"
|
|
|
|
" uint m_DensityFilterOffset;\n"
|
|
|
|
" uint m_YAxisUp;\n"
|
|
|
|
" real_bucket_t m_Vibrancy;\n"
|
|
|
|
" real_bucket_t m_HighlightPower;\n"
|
|
|
|
" real_bucket_t m_Gamma;\n"
|
|
|
|
" real_bucket_t m_LinRange;\n"
|
|
|
|
" real_bucket_t m_Background[4];\n"//For some reason, using float4/double4 here does not align no matter what. So just use an array of 4.
|
|
|
|
"} SpatialFilterCL;\n"
|
|
|
|
"\n";
|
2014-07-08 03:11:14 -04:00
|
|
|
|
|
|
|
/// <summary>
/// OpenCL source for a set of unions which pair each vector type with a scalar array of the same length.
/// EmberCL makes extensive use of the built-in vector types, however accessing
/// their members as a buffer is not natively supported.
/// Declaring them in a union with a buffer resolves this problem.
/// </summary>
static const char* UnionCLStructString =
	//uchar3 and its 3 components.
	"typedef union\n{\n"
	" uchar3 m_Uchar3;\n"
	" uchar m_Uchars[3];\n"
	"} uchar3uchars;\n\n"
	//uchar4 and its 4 components.
	"typedef union\n{\n"
	" uchar4 m_Uchar4;\n"
	" uchar m_Uchars[4];\n"
	"} uchar4uchars;\n\n"
	//uint4 and its 4 components.
	"typedef union\n{\n"
	" uint4 m_Uint4;\n"
	" uint m_Uints[4];\n"
	"} uint4uints;\n\n"
	//Use in places where float is required.
	"typedef union\n{\n"
	" float4 m_Float4;\n"
	" float m_Floats[4];\n"
	"} float4floats;\n\n"
	//Use in places where float or double can be used depending on the template type.
	"typedef union\n{\n"
	" real4 m_Real4;\n"
	" real_t m_Reals[4];\n"
	"} real4reals;\n\n"
	//Used to match the bucket template type.
	"typedef union\n{\n"
	" real4_bucket m_Real4;\n"
	" real_bucket_t m_Reals[4];\n"
	"} real4reals_bucket;\n\n";
|
2014-12-05 21:30:46 -05:00
|
|
|
}
|