├── .gitattributes
├── .gitignore
├── LICENSE
├── README.md
├── examples
    └── benchmark
    │   ├── CMakeLists.txt
    │   └── main.cu
└── include
    └── cuda_noise.cuh


/.gitattributes:
--------------------------------------------------------------------------------
 1 | ###############################################################################
 2 | # Set default behavior to automatically normalize line endings.
 3 | ###############################################################################
 4 | * text=auto
 5 | 
 6 | ###############################################################################
 7 | # Set default behavior for command prompt diff.
 8 | #
 9 | # This is needed for earlier builds of msysgit that do not have it on by
10 | # default for csharp files.
11 | # Note: This is only used by command line
12 | ###############################################################################
13 | #*.cs     diff=csharp
14 | 
15 | ###############################################################################
16 | # Set the merge driver for project and solution files
17 | #
18 | # Merging from the command prompt will add diff markers to the files if there
19 | # are conflicts (Merging from VS is not affected by the settings below, in VS
20 | # the diff markers are never inserted). Diff markers may cause the following 
21 | # file extensions to fail to load in VS. An alternative would be to treat
22 | # these files as binary and thus will always conflict and require user
23 | # intervention with every merge. To do so, just uncomment the entries below
24 | ###############################################################################
25 | #*.sln       merge=binary
26 | #*.csproj    merge=binary
27 | #*.vbproj    merge=binary
28 | #*.vcxproj   merge=binary
29 | #*.vcproj    merge=binary
30 | #*.dbproj    merge=binary
31 | #*.fsproj    merge=binary
32 | #*.lsproj    merge=binary
33 | #*.wixproj   merge=binary
34 | #*.modelproj merge=binary
35 | #*.sqlproj   merge=binary
36 | #*.wwaproj   merge=binary
37 | 
38 | ###############################################################################
39 | # behavior for image files
40 | #
41 | # image files are treated as binary by default.
42 | ###############################################################################
43 | #*.jpg   binary
44 | #*.png   binary
45 | #*.gif   binary
46 | 
47 | ###############################################################################
48 | # diff behavior for common document formats
49 | # 
50 | # Convert binary document formats to text before diffing them. This feature
51 | # is only available from the command line. Turn it on by uncommenting the 
52 | # entries below.
53 | ###############################################################################
54 | #*.doc   diff=astextplain
55 | #*.DOC   diff=astextplain
56 | #*.docx  diff=astextplain
57 | #*.DOCX  diff=astextplain
58 | #*.dot   diff=astextplain
59 | #*.DOT   diff=astextplain
60 | #*.pdf   diff=astextplain
61 | #*.PDF   diff=astextplain
62 | #*.rtf   diff=astextplain
63 | #*.RTF   diff=astextplain
64 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
  1 | ## Ignore Visual Studio temporary files, build results, and
  2 | ## files generated by popular Visual Studio add-ons.
  3 | 
  4 | # User-specific files
  5 | *.suo
  6 | *.user
  7 | *.userosscache
  8 | *.sln.docstates
  9 | 
 10 | # User-specific files (MonoDevelop/Xamarin Studio)
 11 | *.userprefs
 12 | 
 13 | # Build results
 14 | [Dd]ebug/
 15 | [Dd]ebugPublic/
 16 | [Rr]elease/
 17 | [Rr]eleases/
 18 | [Xx]64/
 19 | [Xx]86/
 20 | [Bb]uild/
 21 | bld/
 22 | [Bb]in/
 23 | [Oo]bj/
 24 | 
 25 | # Visual Studio 2015 cache/options directory
 26 | .vs/
 27 | # Uncomment if you have tasks that create the project's static files in wwwroot
 28 | #wwwroot/
 29 | 
 30 | # MSTest test Results
 31 | [Tt]est[Rr]esult*/
 32 | [Bb]uild[Ll]og.*
 33 | 
 34 | # NUNIT
 35 | *.VisualState.xml
 36 | TestResult.xml
 37 | 
 38 | # Build Results of an ATL Project
 39 | [Dd]ebugPS/
 40 | [Rr]eleasePS/
 41 | dlldata.c
 42 | 
 43 | # DNX
 44 | project.lock.json
 45 | artifacts/
 46 | 
 47 | *_i.c
 48 | *_p.c
 49 | *_i.h
 50 | *.ilk
 51 | *.meta
 52 | *.obj
 53 | *.pch
 54 | *.pdb
 55 | *.pgc
 56 | *.pgd
 57 | *.rsp
 58 | *.sbr
 59 | *.tlb
 60 | *.tli
 61 | *.tlh
 62 | *.tmp
 63 | *.tmp_proj
 64 | *.log
 65 | *.vspscc
 66 | *.vssscc
 67 | .builds
 68 | *.pidb
 69 | *.svclog
 70 | *.scc
 71 | 
 72 | # Chutzpah Test files
 73 | _Chutzpah*
 74 | 
 75 | # Visual C++ cache files
 76 | ipch/
 77 | *.aps
 78 | *.ncb
 79 | *.opendb
 80 | *.opensdf
 81 | *.sdf
 82 | *.cachefile
 83 | *.VC.db
 84 | 
 85 | # Visual Studio profiler
 86 | *.psess
 87 | *.vsp
 88 | *.vspx
 89 | *.sap
 90 | 
 91 | # TFS 2012 Local Workspace
 92 | $tf/
 93 | 
 94 | # Guidance Automation Toolkit
 95 | *.gpState
 96 | 
 97 | # ReSharper is a .NET coding add-in
 98 | _ReSharper*/
 99 | *.[Rr]e[Ss]harper
100 | *.DotSettings.user
101 | 
102 | # JustCode is a .NET coding add-in
103 | .JustCode
104 | 
105 | # TeamCity is a build add-in
106 | _TeamCity*
107 | 
108 | # DotCover is a Code Coverage Tool
109 | *.dotCover
110 | 
111 | # NCrunch
112 | _NCrunch_*
113 | .*crunch*.local.xml
114 | nCrunchTemp_*
115 | 
116 | # MightyMoose
117 | *.mm.*
118 | AutoTest.Net/
119 | 
120 | # Web workbench (sass)
121 | .sass-cache/
122 | 
123 | # Installshield output folder
124 | [Ee]xpress/
125 | 
126 | # DocProject is a documentation generator add-in
127 | DocProject/buildhelp/
128 | DocProject/Help/*.HxT
129 | DocProject/Help/*.HxC
130 | DocProject/Help/*.hhc
131 | DocProject/Help/*.hhk
132 | DocProject/Help/*.hhp
133 | DocProject/Help/Html2
134 | DocProject/Help/html
135 | 
136 | # Click-Once directory
137 | publish/
138 | 
139 | # Publish Web Output
140 | *.[Pp]ublish.xml
141 | *.azurePubxml
142 | 
143 | # TODO: Un-comment the next line if you do not want to checkin
144 | # your web deploy settings because they may include unencrypted
145 | # passwords
146 | #*.pubxml
147 | *.publishproj
148 | 
149 | # NuGet Packages
150 | *.nupkg
151 | # The packages folder can be ignored because of Package Restore
152 | **/packages/*
153 | # except build/, which is used as an MSBuild target.
154 | !**/packages/build/
155 | # Uncomment if necessary however generally it will be regenerated when needed
156 | #!**/packages/repositories.config
157 | # NuGet v3's project.json files produce more ignorable files
158 | *.nuget.props
159 | *.nuget.targets
160 | 
161 | # Microsoft Azure Build Output
162 | csx/
163 | *.build.csdef
164 | 
165 | # Microsoft Azure Emulator
166 | ecf/
167 | rcf/
168 | 
169 | # Windows Store app package directory
170 | AppPackages/
171 | BundleArtifacts/
172 | 
173 | # Visual Studio cache files
174 | # files ending in .cache can be ignored
175 | *.[Cc]ache
176 | # but keep track of directories ending in .cache
177 | !*.[Cc]ache/
178 | 
179 | # Others
180 | ClientBin/
181 | [Ss]tyle[Cc]op.*
182 | ~$*
183 | *~
184 | *.dbmdl
185 | *.dbproj.schemaview
186 | *.pfx
187 | *.publishsettings
188 | node_modules/
189 | orleans.codegen.cs
190 | 
191 | # RIA/Silverlight projects
192 | Generated_Code/
193 | 
194 | # Backup & report files from converting an old project file
195 | # to a newer Visual Studio version. Backup files are not needed,
196 | # because we have git ;-)
197 | _UpgradeReport_Files/
198 | Backup*/
199 | UpgradeLog*.XML
200 | UpgradeLog*.htm
201 | 
202 | # SQL Server files
203 | *.mdf
204 | *.ldf
205 | 
206 | # Business Intelligence projects
207 | *.rdl.data
208 | *.bim.layout
209 | *.bim_*.settings
210 | 
211 | # Microsoft Fakes
212 | FakesAssemblies/
213 | 
214 | # GhostDoc plugin setting file
215 | *.GhostDoc.xml
216 | 
217 | # Node.js Tools for Visual Studio
218 | .ntvs_analysis.dat
219 | 
220 | # Visual Studio 6 build log
221 | *.plg
222 | 
223 | # Visual Studio 6 workspace options file
224 | *.opt
225 | 
226 | # Visual Studio LightSwitch build output
227 | **/*.HTMLClient/GeneratedArtifacts
228 | **/*.DesktopClient/GeneratedArtifacts
229 | **/*.DesktopClient/ModelManifest.xml
230 | **/*.Server/GeneratedArtifacts
231 | **/*.Server/ModelManifest.xml
232 | _Pvt_Extensions
233 | 
234 | # LightSwitch generated files
235 | GeneratedArtifacts/
236 | ModelManifest.xml
237 | 
238 | # Paket dependency manager
239 | .paket/paket.exe
240 | 
241 | # FAKE - F# Make
242 | .fake/
243 | 
244 | # Cmake
245 | cmake-*
246 | 
247 | # Jetbrains
248 | .idea/
249 | **/.idea/*
250 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2017 Henrik Lehtinen
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | # cudaNoise
 2 | 
 3 | *Library of common noise functions for CUDA kernels*
 4 | 
 5 | Device functions for use in CUDA kernels which provide tools for generating procedural 3D noise.
 6 | Basis noise functions can be combined for fractional Brownian motion, as well as used to perturb
 7 | the input vector for other noise functions for turbulence effects.
 8 | 
 9 | ## Basis functions
10 | 
11 | ![montage](https://user-images.githubusercontent.com/6199226/202872480-512ab0ef-7210-4eff-8c3c-8179701e1f1e.jpg "Basis functions")
12 | 
13 | *Basis functions include: discrete noise, tricubic value noise, perlin gradient noise, simplex noise, spots and worley noise.*
14 | 
15 | ## Derived functions
16 | 
17 | ![cudanoise](https://user-images.githubusercontent.com/6199226/202872441-bc67fadf-ae3f-44ac-afa1-b65eb60a8562.png "Repeater turbulence")
18 | 
19 | *Repeater turbulence of perlin noise functions.*
20 | 
21 | ## Usage
22 | 
23 | cudaNoise comes as a single-header include library. Simply include cuda_noise.cuh in your CUDA source file, then call the cudaNoise functions from kernel or device functions. 
24 | 
25 | **NOTE: cudaNoise is designed to be used from inside CUDA kernels and cannot directly be called from host code**
26 | 
27 | There is a simple benchmark included in the /examples/benchmark directory.
28 | 
29 | ## Reference
30 | 
31 | ### Basis functions
32 | 
33 | #### 3D Checker pattern
34 | 
35 | ```cpp
36 | float checker(float3 pos, float scale, int seed)
37 | ```
38 | 
39 | #### 3D Discrete noise
40 | 
41 | ```cpp
42 | float discreteNoise(float3 pos, float scale, int seed)
43 | ```
44 | 
45 | #### 3D Linear value noise
46 | 
47 | ```cpp
48 | float linearValue(float3 pos, float scale, int seed)
49 | ```
50 | 
51 | #### 3D Cubic value noise
52 | 
53 | ```cpp
54 | float cubicValue(float3 pos, float scale, int seed)
55 | ```
56 | 
57 | #### 3D Perlin gradient noise
58 | 
59 | ```cpp
60 | float perlinNoise(float3 pos, float scale, int seed)
61 | ```
62 | 
63 | #### 3D Simplex noise
64 | 
65 | ```cpp
66 | float simplexNoise(float3 pos, float scale, int seed)
67 | ```
68 | 
69 | #### 3D Worley cellular noise
70 | 
71 | ```cpp
72 | float worleyNoise(float3 pos, float scale, int seed, float size, int minNum, int maxNum, float jitter)
73 | ```
74 | 
75 | #### 3D Spots
76 | 
77 | ```cpp
78 | float spots(float3 pos, float scale, int seed, float size, int minNum, int maxNum, float jitter, profileShape shape)
79 | ```
80 | 
81 | ## TODO
82 | 
83 | - Implement 4D noise functions.
84 | - Optimization work.
85 | - Add more types of cellular functions.
86 | - Cleaning up the interface.
87 | 
88 | Contributions are more than welcome!
89 | 


--------------------------------------------------------------------------------
/examples/benchmark/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | cmake_minimum_required(VERSION 3.17)
 2 | project(benchmark CUDA)
 3 | 
 4 | set(CMAKE_CUDA_STANDARD 14)
 5 | set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -arch=sm_61 -use_fast_math --ptxas-options=-v,-O3")
 6 | message(NVCC Flags: ${CMAKE_CUDA_FLAGS})
 7 | 
 8 | add_executable(benchmark main.cu)
 9 | 
10 | set_target_properties(
11 |         benchmark
12 |         PROPERTIES
13 |         CUDA_SEPARABLE_COMPILATION ON)


--------------------------------------------------------------------------------
/examples/benchmark/main.cu:
--------------------------------------------------------------------------------
  1 | #include <iostream>
  2 | #include <chrono>
  3 | #include <fstream>
  4 | #include <string_view>
  5 | 
  6 | #include "../../include/cuda_noise.cuh"
  7 | 
  8 | // Benchmark kernel: each thread averages `iterations` repeaterPerlin samples and writes the result as one byte.
  9 | __global__ void benchmarkPerlin(unsigned char* outputBuffer, int iterations)
 10 | {
 11 |     int x = threadIdx.x + blockIdx.x * blockDim.x;
 12 |     int y = threadIdx.y + blockIdx.y * blockDim.y;
 13 |     long idx = x + y * blockDim.x *  gridDim.x; // row-major; there is no bounds check, so the launch grid must match the buffer
 14 |     // Spread the launch grid over [0, 16) on both axes
 15 |     float fx = static_cast<float>(x) / (blockDim.x * gridDim.x) * 16.0f;
 16 |     float fy = static_cast<float>(y) / (blockDim.y * gridDim.y) * 16.0f;
 17 |     float3 pos = make_float3(fx, fy, 0.0f);
 18 | 
 19 |     float sum = 0.0f;
 20 |     unsigned int seed = 0x71889283;
 21 |     for(int i = 0; i < iterations; i++)
 22 |     {
 23 |         // Mix in unsigned arithmetic: (i + 91482) * 1778932 does not fit in a signed int, and signed overflow is undefined
 24 |         seed = seed ^ ((static_cast<unsigned int>(i) + 91482u) * 1778932u);
 25 |         sum += cudaNoise::repeaterPerlin(pos, 1.0f, seed, 32, 2.0f, 0.5f);
 26 |     }
 27 |     outputBuffer[idx] = static_cast<unsigned char>((sum / static_cast<float>(iterations)) * 63.0f + 127.0f);
 28 | }
 29 | 
 30 | // Benchmark kernel: each thread averages `iterations` repeaterSimplex samples and writes the result as one byte.
 31 | __global__ void benchmarkSimplex(unsigned char* outputBuffer, int iterations)
 32 | {
 33 |     int x = threadIdx.x + blockIdx.x * blockDim.x;
 34 |     int y = threadIdx.y + blockIdx.y * blockDim.y;
 35 |     long idx = x + y * blockDim.x *  gridDim.x; // row-major; there is no bounds check, so the launch grid must match the buffer
 36 |     // Spread the launch grid over [0, 16) on both axes
 37 |     float fx = static_cast<float>(x) / (blockDim.x * gridDim.x) * 16.0f;
 38 |     float fy = static_cast<float>(y) / (blockDim.y * gridDim.y) * 16.0f;
 39 |     float3 pos = make_float3(fx, fy, 0.0f);
 40 | 
 41 |     float sum = 0.0f;
 42 |     unsigned int seed = 0x71889283;
 43 |     for(int i = 0; i < iterations; i++)
 44 |     {
 45 |         // Mix in unsigned arithmetic: (i + 91482) * 1778932 does not fit in a signed int, and signed overflow is undefined
 46 |         seed = seed ^ ((static_cast<unsigned int>(i) + 91482u) * 1778932u);
 47 |         sum += cudaNoise::repeaterSimplex(pos, 1.0f, seed, 32, 2.0f, 0.5f);
 48 |     }
 49 |     outputBuffer[idx] = static_cast<unsigned char>((sum / static_cast<float>(iterations)) * 127.0f + 127.0f);
 50 | }
 51 | 
 52 | void writeToDisk(unsigned char* buffer, const std::string& filename, size_t datasize)
 53 | {
 54 |     // Dumps datasize raw bytes from buffer into filename; a failed open leaves the stream in a failed state, so one check covers open and write
 55 |     std::ofstream file(filename, std::ios::out | std::ios::binary);
 56 |     if (!file.write(reinterpret_cast<const char*>(buffer), datasize)) std::cerr << "Failed to write " << filename << std::endl;
 57 | }
 58 | 
 59 | int main()
 60 | {
 61 |     std::cout << "Benchmarking cuda-noise..." << std::endl;
 62 |     // Times one launch of each kernel over a DIM x DIM byte image and dumps both images to disk
 63 |     const size_t DIM = 4096;
 64 |     const int iterations = 32;
 65 |     dim3 blockSize {16, 16};
 66 |     dim3 gridSize { static_cast<int>(DIM) / blockSize.x, static_cast<int>(DIM) / blockSize.y };
 67 | 
 68 |     unsigned char* d_outputBuffer = nullptr;
 69 |     unsigned char* h_outputBuffer = nullptr;
 70 |     if (cudaMalloc((void**)&d_outputBuffer, DIM * DIM * sizeof(unsigned char)) != cudaSuccess ||
 71 |         cudaMallocHost((void**)&h_outputBuffer, DIM * DIM * sizeof(unsigned char)) != cudaSuccess)
 72 |     {
 73 |         std::cerr << "CUDA allocation failed" << std::endl; // never launch the kernels on an invalid buffer
 74 |         cudaFree(d_outputBuffer); // still nullptr if the device allocation itself failed
 75 |         return 1;
 76 |     }
 77 |     {
 78 |         auto start = std::chrono::steady_clock::now(); // monotonic clock: wall-clock adjustments cannot skew the interval
 79 |         benchmarkPerlin<<<gridSize, blockSize>>>(d_outputBuffer, iterations);
 80 |         cudaDeviceSynchronize();
 81 |         auto end = std::chrono::steady_clock::now();
 82 |         auto elapsed = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
 83 |         std::cout << "Perlin noise: " << elapsed.count() << " milliseconds" << std::endl;
 84 |     }
 85 |     if (cudaError_t err = cudaGetLastError()) std::cerr << "benchmarkPerlin failed: " << cudaGetErrorString(err) << std::endl;
 86 |     cudaMemcpy(h_outputBuffer, d_outputBuffer, DIM * DIM * sizeof(unsigned char), cudaMemcpyDeviceToHost);
 87 |     writeToDisk(h_outputBuffer, "perlin.data", DIM * DIM * sizeof(unsigned char));
 88 | 
 89 |     {
 90 |         auto start = std::chrono::steady_clock::now();
 91 |         benchmarkSimplex<<<gridSize, blockSize>>>(d_outputBuffer, iterations);
 92 |         cudaDeviceSynchronize();
 93 |         auto end = std::chrono::steady_clock::now();
 94 |         auto elapsed = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
 95 |         std::cout << "Simplex noise: " << elapsed.count() << " milliseconds" << std::endl;
 96 |     }
 97 |     if (cudaError_t err = cudaGetLastError()) std::cerr << "benchmarkSimplex failed: " << cudaGetErrorString(err) << std::endl;
 98 |     cudaMemcpy(h_outputBuffer, d_outputBuffer, DIM * DIM * sizeof(unsigned char), cudaMemcpyDeviceToHost);
 99 |     writeToDisk(h_outputBuffer, "simplex.data", DIM * DIM * sizeof(unsigned char));
100 |     cudaFree(d_outputBuffer);
101 |     cudaFreeHost(h_outputBuffer);
102 |     return 0;
103 | }
104 | 


--------------------------------------------------------------------------------
/include/cuda_noise.cuh:
--------------------------------------------------------------------------------
  1 | // cudaNoise
  2 | // Library of common 3D noise functions for CUDA kernels
  3 | 
  4 | #pragma once
  5 | 
  6 | #include <cuda_runtime.h>
  7 | 
  8 | namespace cudaNoise {
  9 | 
 10 | 	// Basis functions (identifiers for the basis noise types)
 11 | 	typedef enum {
 12 | 		BASIS_CHECKER,
 13 | 		BASIS_DISCRETE,
 14 | 		BASIS_LINEARVALUE,
 15 | 		BASIS_FADEDVALUE, // NOTE(review): the README reference lists no faded-value function — confirm this entry is still used
 16 | 		BASIS_CUBICVALUE,
 17 | 		BASIS_PERLIN,
 18 | 		BASIS_SIMPLEX,
 19 | 		BASIS_WORLEY,
 20 | 		BASIS_SPOTS
 21 | 	} basisFunction;
 22 | 
 23 | 	// Shaping functions: falloff profile that spots() applies to each spot
 24 | 	typedef enum {
 25 | 		SHAPE_STEP, // 1 when the squared distance to the spot is below size, otherwise -1
 26 | 		SHAPE_LINEAR, // 1 - clamp(|du| + |dv| + |dw|, 0, size) / size
 27 | 		SHAPE_QUADRATIC // 1 - clamp(squared distance, 0, size) / size
 28 | 	} profileShape;
 29 | 
 30 | 	// Function blending operators (presumably how repeated noise layers are combined — confirm against the repeater functions)
 31 | 	typedef enum {
 32 | 		OPERATOR_ADD,
 33 | 		OPERATOR_AVG,
 34 | 		OPERATOR_MUL,
 35 | 		OPERATOR_MAX,
 36 | 		OPERATOR_MIN
 37 | 	} repeatOperator;
 38 | 
 39 | #define EPSILON 0.000000001f // spots() and worleyNoise() return 0 when their size argument is below this
 40 | 
 41 | 	// Utility functions
 42 | 
 43 | 	// Integer hash: scrambles seed through six add/xor/shift rounds (cheap on-device pseudorandom source for the noise functions)
 44 | 	__device__ unsigned int hash(unsigned int seed)
 45 | 	{
 46 | 		unsigned int h = seed;
 47 | 		h = (h + 0x7ed55d16u) + (h << 12);
 48 | 		h = (h ^ 0xc761c23cu) ^ (h >> 19);
 49 | 		h = (h + 0x165667b1u) + (h << 5);
 50 | 		h = (h + 0xd3a2646cu) ^ (h << 9);
 51 | 		h = (h + 0xfd7046c5u) + (h << 3);
 52 | 		h = (h ^ 0xb55a4f09u) ^ (h >> 16);
 53 | 		return h;
 54 | 	}
 55 | 
 56 | 	// Returns a pseudorandom integer in [min, max] derived from seed
 57 | 	__device__ int randomIntRange(int min, int max, int seed)
 58 | 	{
 59 | 		if (max <= min) return min; // empty or single-value range; also rules out a zero modulus when max == min - 1
 60 | 		// Reduce the hash while it is still unsigned: converting it to int first can go negative and push the result below min
 61 | 		unsigned int span = (unsigned int)max - (unsigned int)min + 1u; // wraps to 0 only for the full int range
 62 | 		return (int)((unsigned int)min + (span != 0u ? hash(seed) % span : hash(seed)));
 63 | 	}
 64 | 
 65 | 	// Hashes seed and normalizes the result to a float in [0, 1]
 66 | 	__device__ float randomFloat(unsigned int seed)
 67 | 	{
 68 | 		const float hashed = (float)hash(seed);
 69 | 		const float maxHash = (float)0xffffffff;
 70 | 		return (hashed / maxHash);
 71 | 	}
 72 | 
 73 | 	// Clamps val between [min, max]
 74 | 	__device__ float clamp(float val, float min, float max)
 75 | 	{
 76 | 		// Use the caller's bounds rather than a fixed [0, 1] range
 77 | 		if (val < min)
 78 | 			return min;
 79 | 		else if (val > max)
 80 | 			return max;
 81 | 		return val;
 82 | 	}
 83 | 
 84 | 	// Maps from the unsigned range [0, 1] to the signed range [-1, 1]
 85 | 	// NOTE: the input is not clamped
 86 | 	__device__ float mapToSigned(float input)
 87 | 	{
 88 | 		return 2.0f * input - 1.0f;
 89 | 	}
 90 | 
 91 | 	// Maps from the signed range [-1, 1] to the unsigned range [0, 1]
 92 | 	// NOTE: the input is not clamped
 93 | 	__device__ float mapToUnsigned(float input)
 94 | 	{
 95 | 		return 0.5f * input + 0.5f;
 96 | 	}
 97 | 
 98 | 	// Clamps input to [0, 1], then maps it to the signed range [-1, 1]
 99 | 	__device__ float clampToSigned(float input) {
100 | 		const float unit = __saturatef(input);
101 | 		return unit * 2.0f - 1.0f;
102 | 	}
103 | 
104 | 	// Maps from the signed range [-1, 1] to [0, 1] and clamps the result to that range
105 | 	__device__ float clampToUnsigned(float input) {
106 | 		const float shifted = input * 0.5f + 0.5f;
107 | 		return __saturatef(shifted);
108 | 	}
109 | 
110 | 
111 | 	// Random float in [-1, 1] for a grid coordinate; the hash key uses wrapping unsigned integer math because casting a negative float sum to unsigned is undefined
112 | 	__device__ float randomGrid(int x, int y, int z, int seed = 0)
113 | 	{
114 | 		return mapToSigned(randomFloat((unsigned int)x * 1723u + (unsigned int)y * 93241u + (unsigned int)z * 149812u + 3824u + (unsigned int)seed));
115 | 	}
116 | 
117 | 	// Random unsigned int for a grid coordinate [0, MAXUINT]; coordinates and seed are combined in float, then hashed
118 | 	__device__ unsigned int randomIntGrid(float x, float y, float z, float seed = 0.0f)
119 | 	{
120 | 		return hash((unsigned int)(x * 1723.0f + y * 93241.0f + z * 149812.0f + 3824 + seed)); // NOTE(review): a negative sum cannot be represented by this cast — confirm callers stay non-negative
121 | 	}
122 | 
123 | 	// Random vector as float3 from grid position: x and y are randomized in [-1, 1], z is always 0
124 | 	__device__ float3 vectorNoise(int x, int y, int z)
125 | 	{
126 | 		return make_float3(randomFloat(x * 8231.0f + y * 34612.0f + z * 11836.0f + 19283.0f) * 2.0f - 1.0f, // NOTE(review): the float key converts implicitly to unsigned; negative sums are not representable — confirm inputs
127 | 			randomFloat(x * 1171.0f + y * 9234.0f + z * 992903.0f + 1466.0f) * 2.0f - 1.0f,
128 | 			0.0f);
129 | 	}
130 | 
131 | 	// Multiplies every component of v by factor
132 | 	__device__ float3 scaleVector(float3 v, float factor) {
133 | 		v.x *= factor; v.y *= factor; v.z *= factor;
134 | 		return v;
135 | 	}
136 | 
137 | 	// Multiplies the x, y and z components of v by xf, yf and zf respectively
138 | 	__device__ float3 nonuniformScaleVector(float3 v, float xf, float yf, float zf) {
139 | 		v.x *= xf; v.y *= yf; v.z *= zf;
140 | 		return v;
141 | 	}
142 | 
143 | 
144 | 	// Component-wise sum of v and w
145 | 	__device__ float3 addVectors(float3 v, float3 w) {
146 | 		v.x += w.x; v.y += w.y; v.z += w.z;
147 | 		return v;
148 | 	}
149 | 
150 | 	// Dot product of the vectors u and v
151 | 	__device__ float dotProduct(float3 u, float3 v) {
152 | 		const float xy = u.x * v.x + u.y * v.y;
153 | 		return (xy + u.z * v.z);
154 | 	}
155 | 
156 | 	// Device constants for noise
157 | 	// Gradient directions read by simplexNoise via calcPerm12: 12 rows are listed, the remaining 4 of the 16 are zero-initialized
158 | 	__device__ __constant__ float gradMap[16][3] = { { 1.0f, 1.0f, 0.0f },{ -1.0f, 1.0f, 0.0f },{ 1.0f, -1.0f, 0.0f },{ -1.0f, -1.0f, 0.0f },
159 | 	{ 1.0f, 0.0f, 1.0f },{ -1.0f, 0.0f, 1.0f },{ 1.0f, 0.0f, -1.0f },{ -1.0f, 0.0f, -1.0f },
160 | 	{ 0.0f, 1.0f, 1.0f },{ 0.0f, -1.0f, 1.0f },{ 0.0f, 1.0f, -1.0f },{ 0.0f, -1.0f, -1.0f }};
161 | 
162 | 	// Helper functions for noise
163 | 
164 | 	// Linear blend: returns a when ratio is 0 and b when ratio is 1
165 | 	__device__  float lerp(float a, float b, float ratio) {
166 | 		const float keep = 1.0f - ratio;
167 | 		return a * keep + b * ratio;
168 | 	}
169 | 
170 | 	// 1D cubic interpolation through four samples, evaluated at x between p1 (x = 0) and p2 (x = 1)
171 | 	__device__ float cubic(float p0, float p1, float p2, float p3, float x) {
172 | 		const float curve = 2.0f * p0 - 5.0f * p1 + 4.0f * p2 - p3 + x * (3.0f * (p1 - p2) + p3 - p0);
173 | 		return p1 + 0.5f * x * (p2 - p0 + x * curve);
174 | 	}
175 | 
176 | 	// Fast gradient function for gradient noise: dot product of (x, y, z) with the direction picked by the low 4 bits of hash
177 | 	__device__ float grad(int hash, float x, float y, float z)
178 | 	{
179 | 		switch (hash & 0xF)
180 | 		{
181 | 		case 0x0: return x + y; // ( 1,  1,  0)
182 | 		case 0x1: return -x + y; // (-1,  1,  0)
183 | 		case 0x2: return x - y; // ( 1, -1,  0)
184 | 		case 0x3: return -x - y; // (-1, -1,  0)
185 | 		case 0x4: return x + z; // ( 1,  0,  1)
186 | 		case 0x5: return -x + z; // (-1,  0,  1)
187 | 		case 0x6: return x - z; // ( 1,  0, -1)
188 | 		case 0x7: return -x - z; // (-1,  0, -1)
189 | 		case 0x8: return y + z; // ( 0,  1,  1)
190 | 		case 0x9: return -y + z; // ( 0, -1,  1)
191 | 		case 0xA: return y - z; // ( 0,  1, -1)
192 | 		case 0xB: return -y - z; // ( 0, -1, -1)
193 | 		case 0xC: return y + x; // ( 1,  1,  0) — the last four cases repeat directions used above
194 | 		case 0xD: return -y + z; // ( 0, -1,  1)
195 | 		case 0xE: return y - x; // (-1,  1,  0)
196 | 		case 0xF: return -y - z; // ( 0, -1, -1)
197 | 		default: return 0; // never happens: the switch value is masked to 0..15
198 | 		}
199 | 	}
200 | 
201 | 	// Ken Perlin's quintic fade curve, 6t^5 - 15t^4 + 10t^3
202 | 	__device__ float fade(float t) {
203 | 		const float poly = t * (t * 6.0f - 15.0f) + 10.0f;
204 | 		return t * t * t * poly;
205 | 	}
206 | 
207 | 	// Dot product of the 3-element array g with (x, y, z). NOTE: could be cleaned up
208 | 	__device__ float dot(float g[3], float x, float y, float z) {
209 | 		const float xy = g[0] * x + g[1] * y;
210 | 		return xy + g[2] * z;
211 | 	}
212 | 
213 | 	// Pseudorandom byte in [0, 255] for simplex noise: the low 8 bits of hash(p)
214 | 	__device__ unsigned char calcPerm(int p) {
215 | 		const unsigned int hashed = hash(p);
216 | 		return (unsigned char)hashed;
217 | 	}
218 | 
219 | 	// Pseudorandom index in [0, 11] for simplex noise: hash(p) modulo 12
220 | 	__device__ unsigned char calcPerm12(int p) {
221 | 		const unsigned int hashed = hash(p);
222 | 		return (unsigned char)(hashed % 12);
223 | 	}
224 | 
225 | 	// Noise functions
226 | 
227 | 	// Simplex noise adapted from Java code by Stefan Gustavson and Peter Eastman
228 | 	__device__ float simplexNoise(float3 pos, float scale, int seed)
229 | 	{
230 | 		// Samples 3D simplex noise at pos * scale; seed offsets the hash that picks each corner gradient
231 | 		float xin = pos.x * scale;
232 | 		float yin = pos.y * scale;
233 | 		float zin = pos.z * scale;
234 | 		// Skewing and unskewing factors for 3 dimensions
235 | 		float F3 = 1.0f / 3.0f;
236 | 		float G3 = 1.0f / 6.0f;
237 | 
238 | 		float n0, n1, n2, n3; // Noise contributions from the four corners
239 | 
240 | 		// Skew the input space to determine which simplex cell we're in
241 | 		float s = (xin + yin + zin)*F3; // Very nice and simple skew factor for 3D
242 | 		int i = (int)floorf(xin + s);
243 | 		int j = (int)floorf(yin + s);
244 | 		int k = (int)floorf(zin + s);
245 | 		float t = (i + j + k)*G3;
246 | 		float X0 = i - t; // Unskew the cell origin back to (x,y,z) space
247 | 		float Y0 = j - t;
248 | 		float Z0 = k - t;
249 | 		float x0 = xin - X0; // The x,y,z distances from the cell origin
250 | 		float y0 = yin - Y0;
251 | 		float z0 = zin - Z0;
252 | 
253 | 		// For the 3D case, the simplex shape is a slightly irregular tetrahedron.
254 | 		// Determine which simplex we are in.
255 | 		int i1, j1, k1; // Offsets for second corner of simplex in (i,j,k) coords
256 | 		int i2, j2, k2; // Offsets for third corner of simplex in (i,j,k) coords
257 | 		if (x0 >= y0) {
258 | 			if (y0 >= z0)
259 | 			{
260 | 				i1 = 1; j1 = 0; k1 = 0; i2 = 1; j2 = 1; k2 = 0;
261 | 			} // X Y Z order
262 | 			else if (x0 >= z0) { i1 = 1; j1 = 0; k1 = 0; i2 = 1; j2 = 0; k2 = 1; } // X Z Y order
263 | 			else { i1 = 0; j1 = 0; k1 = 1; i2 = 1; j2 = 0; k2 = 1; } // Z X Y order
264 | 		}
265 | 		else { // x0<y0
266 | 			if (y0 < z0) { i1 = 0; j1 = 0; k1 = 1; i2 = 0; j2 = 1; k2 = 1; } // Z Y X order
267 | 			else if (x0 < z0) { i1 = 0; j1 = 1; k1 = 0; i2 = 0; j2 = 1; k2 = 1; } // Y Z X order
268 | 			else { i1 = 0; j1 = 1; k1 = 0; i2 = 1; j2 = 1; k2 = 0; } // Y X Z order
269 | 		}
270 | 
271 | 		// A step of (1,0,0) in (i,j,k) means a step of (1-c,-c,-c) in (x,y,z),
272 | 		// a step of (0,1,0) in (i,j,k) means a step of (-c,1-c,-c) in (x,y,z), and
273 | 		// a step of (0,0,1) in (i,j,k) means a step of (-c,-c,1-c) in (x,y,z), where
274 | 		// c = 1/6.
275 | 		float x1 = x0 - i1 + G3; // Offsets for second corner in (x,y,z) coords
276 | 		float y1 = y0 - j1 + G3;
277 | 		float z1 = z0 - k1 + G3;
278 | 		float x2 = x0 - i2 + 2.0f*G3; // Offsets for third corner in (x,y,z) coords
279 | 		float y2 = y0 - j2 + 2.0f*G3;
280 | 		float z2 = z0 - k2 + 2.0f*G3;
281 | 		float x3 = x0 - 1.0f + 3.0f*G3; // Offsets for last corner in (x,y,z) coords
282 | 		float y3 = y0 - 1.0f + 3.0f*G3;
283 | 		float z3 = z0 - 1.0f + 3.0f*G3;
284 | 		// Build the corner hash keys in unsigned arithmetic so large lattice coordinates wrap instead of overflowing a signed int
285 | 		int gi0 = calcPerm12((int)((unsigned int)seed + (unsigned int)i * 607495u + (unsigned int)j * 359609u + (unsigned int)k * 654846u));
286 | 		int gi1 = calcPerm12((int)((unsigned int)seed + (unsigned int)(i + i1) * 607495u + (unsigned int)(j + j1) * 359609u + (unsigned int)(k + k1) * 654846u));
287 | 		int gi2 = calcPerm12((int)((unsigned int)seed + (unsigned int)(i + i2) * 607495u + (unsigned int)(j + j2) * 359609u + (unsigned int)(k + k2) * 654846u));
288 | 		int gi3 = calcPerm12((int)((unsigned int)seed + (unsigned int)(i + 1) * 607495u + (unsigned int)(j + 1) * 359609u + (unsigned int)(k + 1) * 654846u));
289 | 
290 | 		// Calculate the contribution from the four corners
291 | 		float t0 = 0.6f - x0 * x0 - y0 * y0 - z0 * z0;
292 | 		if (t0 < 0.0f) n0 = 0.0f;
293 | 		else {
294 | 			t0 *= t0;
295 | 			n0 = t0 * t0 * dot(gradMap[gi0], x0, y0, z0);
296 | 		}
297 | 		float t1 = 0.6f - x1 * x1 - y1 * y1 - z1 * z1;
298 | 		if (t1 < 0.0f) n1 = 0.0f;
299 | 		else {
300 | 			t1 *= t1;
301 | 			n1 = t1 * t1 * dot(gradMap[gi1], x1, y1, z1);
302 | 		}
303 | 		float t2 = 0.6f - x2 * x2 - y2 * y2 - z2 * z2;
304 | 		if (t2 < 0.0f) n2 = 0.0f;
305 | 		else {
306 | 			t2 *= t2;
307 | 			n2 = t2 * t2 * dot(gradMap[gi2], x2, y2, z2);
308 | 		}
309 | 		float t3 = 0.6f - x3 * x3 - y3 * y3 - z3 * z3;
310 | 		if (t3 < 0.0f) n3 = 0.0f;
311 | 		else {
312 | 			t3 *= t3;
313 | 			n3 = t3 * t3 * dot(gradMap[gi3], x3, y3, z3);
314 | 		}
315 | 
316 | 		// Add contributions from each corner to get the final noise value.
317 | 		// The result is scaled to stay just inside [-1,1]
318 | 		return 32.0f*(n0 + n1 + n2 + n3);
319 | 	}
320 | 
321 | 	// Checker pattern: +1 on cells whose integer coordinates sum to an even number, -1 otherwise (seed is unused)
322 | 	__device__ float checker(float3 pos, float scale, int seed)
323 | 	{
324 | 		// floorf rather than truncation, so the cells on either side of zero stay distinct
325 | 		int ix = (int)floorf(pos.x * scale);
326 | 		int iy = (int)floorf(pos.y * scale);
327 | 		int iz = (int)floorf(pos.z * scale);
328 | 		if ((ix + iy + iz) % 2 == 0)
329 | 			return 1.0f;
330 | 
331 | 		return -1.0f;
332 | 	}
333 | 
334 | 	// Random spots: scatters minNum..maxNum jittered spots per cell of the scaled grid and returns the strongest profile at pos (0 if size < EPSILON)
335 | 	__device__ float spots(float3 pos, float scale, int seed, float size, int minNum, int maxNum, float jitter, profileShape shape)
336 | 	{
337 | 		if (size < EPSILON)
338 | 			return 0.0f;
339 | 		// Cell that contains the scaled position; floorf keeps cells uniform for negative coordinates
340 | 		int ix = (int)floorf(pos.x * scale);
341 | 		int iy = (int)floorf(pos.y * scale);
342 | 		int iz = (int)floorf(pos.z * scale);
343 | 		// Offset inside the cell, taken from the scaled coordinate so it stays within the cell for any scale
344 | 		float u = pos.x * scale - (float)ix;
345 | 		float v = pos.y * scale - (float)iy;
346 | 		float w = pos.z * scale - (float)iz;
347 | 
348 | 		float val = -1.0f; // stays -1 unless a spot raises it
349 | 
350 | 		// We need to traverse the entire 3x3x3 neighborhood in case there are spots in neighbors near the edges of the cell
351 | 		for (int x = -1; x < 2; x++)
352 | 		{
353 | 			for (int y = -1; y < 2; y++)
354 | 			{
355 | 				for (int z = -1; z < 2; z++)
356 | 				{
357 | 					int numSpots = randomIntRange(minNum, maxNum, seed + (ix + x) * 823746.0f + (iy + y) * 12306.0f + (iz + z) * 823452.0f + 3234874.0f);
358 | 
359 | 					for (int i = 0; i < numSpots; i++)
360 | 					{
361 | 						float distU = u - x - (randomFloat(seed + (ix + x) * 23784.0f + (iy + y) * 9183.0f + (iz + z) * 23874.0f * i + 27432.0f) * jitter - jitter / 2.0f);
362 | 						float distV = v - y - (randomFloat(seed + (ix + x) * 12743.0f + (iy + y) * 45191.0f + (iz + z) * 144421.0f * i + 76671.0f) * jitter - jitter / 2.0f);
363 | 						float distW = w - z - (randomFloat(seed + (ix + x) * 82734.0f + (iy + y) * 900213.0f + (iz + z) * 443241.0f * i + 199823.0f) * jitter - jitter / 2.0f);
364 | 
365 | 						float distanceSq = distU * distU + distV * distV + distW * distW;
366 | 						float distanceAbs = 0.0f;
367 | 
368 | 						switch (shape)
369 | 						{
370 | 						case(SHAPE_STEP):
371 | 							if (distanceSq < size)
372 | 								val = fmaxf(val, 1.0f);
373 | 							else
374 | 								val = fmaxf(val, -1.0f);
375 | 							break;
376 | 						case(SHAPE_LINEAR):
377 | 							distanceAbs = fabsf(distU) + fabsf(distV) + fabsf(distW);
378 | 							val = fmaxf(val, 1.0f - clamp(distanceAbs, 0.0f, size) / size);
379 | 							break;
380 | 						case(SHAPE_QUADRATIC):
381 | 							val = fmaxf(val, 1.0f - clamp(distanceSq, 0.0f, size) / size);
382 | 							break;
383 | 						}
384 | 					}
385 | 				}
386 | 			}
387 | 		}
388 | 
389 | 		return val;
390 | 	}
391 | 
392 | 	// Worley cellular noise
393 | 	__device__ float worleyNoise(float3 pos, float scale, int seed, float size, int minNum, int maxNum, float jitter)
394 | 	{
395 | 		if (size < EPSILON)
396 | 			return 0.0f;
397 | 
398 | 		int ix = (int)(pos.x * scale);
399 | 		int iy = (int)(pos.y * scale);
400 | 		int iz = (int)(pos.z * scale);
401 | 
402 | 		float u = pos.x - (float)ix;
403 | 		float v = pos.y - (float)iy;
404 | 		float w = pos.z - (float)iz;
405 | 
406 | 		float minDist = 1000000.0f;
407 | 
408 | 		// Traverse the whole 3x3 neighborhood looking for the closest feature point
409 | 		for (int x = -1; x < 2; x++)
410 | 		{
411 | 			for (int y = -1; y < 2; y++)
412 | 			{
413 | 				for (int z = -1; z < 2; z++)
414 | 				{
415 | 					int numPoints = randomIntRange(minNum, maxNum, seed + (ix + x) * 823746.0f + (iy + y) * 12306.0f + (iz + z) * 67262.0f);
416 | 
417 | 					for (int i = 0; i < numPoints; i++)
418 | 					{
419 | 						float distU = u - x - (randomFloat(seed + (ix + x) * 23784.0f + (iy + y) * 9183.0f + (iz + z) * 23874.0f * i + 27432.0f) * jitter - jitter / 2.0f);
420 | 						float distV = v - y - (randomFloat(seed + (ix + x) * 12743.0f + (iy + y) * 45191.0f + (iz + z) * 144421.0f * i + 76671.0f) * jitter - jitter / 2.0f);
421 | 						float distW = w - z - (randomFloat(seed + (ix + x) * 82734.0f + (iy + y) * 900213.0f + (iz + z) * 443241.0f * i + 199823.0f) * jitter - jitter / 2.0f);
422 | 
423 | 						float distanceSq = distU * distU + distV * distV + distW * distW;
424 | 
425 | 						if (distanceSq < minDist)
426 | 							minDist = distanceSq;
427 | 					}
428 | 				}
429 | 			}
430 | 		}
431 | 
432 | 		return __saturatef(minDist) * 2.0f - 1.0f;
433 | 	}
434 | 
435 | 	// Tricubic interpolation
436 | 	__device__ float tricubic(int x, int y, int z, float u, float v, float w)
437 | 	{
438 | 		// interpolate along x first
439 | 		float x00 = cubic(randomGrid(x - 1, y - 1, z - 1), randomGrid(x, y - 1, z - 1), randomGrid(x + 1, y - 1, z - 1), randomGrid(x + 2, y - 1, z - 1), u);
440 | 		float x01 = cubic(randomGrid(x - 1, y - 1, z), randomGrid(x, y - 1, z), randomGrid(x + 1, y - 1, z), randomGrid(x + 2, y - 1, z), u);
441 | 		float x02 = cubic(randomGrid(x - 1, y - 1, z + 1), randomGrid(x, y - 1, z + 1), randomGrid(x + 1, y - 1, z + 1), randomGrid(x + 2, y - 1, z + 1), u);
442 | 		float x03 = cubic(randomGrid(x - 1, y - 1, z + 2), randomGrid(x, y - 1, z + 2), randomGrid(x + 1, y - 1, z + 2), randomGrid(x + 2, y - 1, z + 2), u);
443 | 
444 | 		float x10 = cubic(randomGrid(x - 1, y, z - 1), randomGrid(x, y, z - 1), randomGrid(x + 1, y, z - 1), randomGrid(x + 2, y, z - 1), u);
445 | 		float x11 = cubic(randomGrid(x - 1, y, z), randomGrid(x, y, z), randomGrid(x + 1, y, z), randomGrid(x + 2, y, z), u);
446 | 		float x12 = cubic(randomGrid(x - 1, y, z + 1), randomGrid(x, y, z + 1), randomGrid(x + 1, y, z + 1), randomGrid(x + 2, y, z + 1), u);
447 | 		float x13 = cubic(randomGrid(x - 1, y, z + 2), randomGrid(x, y, z + 2), randomGrid(x + 1, y, z + 2), randomGrid(x + 2, y, z + 2), u);
448 | 
449 | 		float x20 = cubic(randomGrid(x - 1, y + 1, z - 1), randomGrid(x, y + 1, z - 1), randomGrid(x + 1, y + 1, z - 1), randomGrid(x + 2, y + 1, z - 1), u);
450 | 		float x21 = cubic(randomGrid(x - 1, y + 1, z), randomGrid(x, y + 1, z), randomGrid(x + 1, y + 1, z), randomGrid(x + 2, y + 1, z), u);
451 | 		float x22 = cubic(randomGrid(x - 1, y + 1, z + 1), randomGrid(x, y + 1, z + 1), randomGrid(x + 1, y + 1, z + 1), randomGrid(x + 2, y + 1, z + 1), u);
452 | 		float x23 = cubic(randomGrid(x - 1, y + 1, z + 2), randomGrid(x, y + 1, z + 2), randomGrid(x + 1, y + 1, z + 2), randomGrid(x + 2, y + 1, z + 2), u);
453 | 
454 | 		float x30 = cubic(randomGrid(x - 1, y + 2, z - 1), randomGrid(x, y + 2, z - 1), randomGrid(x + 1, y + 2, z - 1), randomGrid(x + 2, y + 2, z - 1), u);
455 | 		float x31 = cubic(randomGrid(x - 1, y + 2, z), randomGrid(x, y + 2, z), randomGrid(x + 1, y + 2, z), randomGrid(x + 2, y + 2, z), u);
456 | 		float x32 = cubic(randomGrid(x - 1, y + 2, z + 1), randomGrid(x, y + 2, z + 1), randomGrid(x + 1, y + 2, z + 1), randomGrid(x + 2, y + 2, z + 1), u);
457 | 		float x33 = cubic(randomGrid(x - 1, y + 2, z + 2), randomGrid(x, y + 2, z + 2), randomGrid(x + 1, y + 2, z + 2), randomGrid(x + 2, y + 2, z + 2), u);
458 | 
459 | 		// interpolate along y
460 | 		float y0 = cubic(x00, x10, x20, x30, v);
461 | 		float y1 = cubic(x01, x11, x21, x31, v);
462 | 		float y2 = cubic(x02, x12, x22, x32, v);
463 | 		float y3 = cubic(x03, x13, x23, x33, v);
464 | 
465 | 		// interpolate along z
466 | 		return cubic(y0, y1, y2, y3, w);
467 | 	}
468 | 
469 | 	// Discrete noise (nearest neighbor)
470 | 	__device__ float discreteNoise(float3 pos, float scale, int seed)
471 | 	{
472 | 		int ix = (int)(pos.x * scale);
473 | 		int iy = (int)(pos.y * scale);
474 | 		int iz = (int)(pos.z * scale);
475 | 
476 | 		return randomGrid(ix, iy, iz, seed);
477 | 	}
478 | 
479 | 	// Linear value noise
480 | 	__device__ float linearValue(float3 pos, float scale, int seed)
481 | 	{
482 | 		float fseed = (float)seed;
483 | 
484 | 		int ix = (int)pos.x;
485 | 		int iy = (int)pos.y;
486 | 		int iz = (int)pos.z;
487 | 
488 | 		float u = pos.x - ix;
489 | 		float v = pos.y - iy;
490 | 		float w = pos.z - iz;
491 | 
492 | 		// Corner values
493 | 		float a000 = randomGrid(ix, iy, iz, fseed);
494 | 		float a100 = randomGrid(ix + 1, iy, iz, fseed);
495 | 		float a010 = randomGrid(ix, iy + 1, iz, fseed);
496 | 		float a110 = randomGrid(ix + 1, iy + 1, iz, fseed);
497 | 		float a001 = randomGrid(ix, iy, iz + 1, fseed);
498 | 		float a101 = randomGrid(ix + 1, iy, iz + 1, fseed);
499 | 		float a011 = randomGrid(ix, iy + 1, iz + 1, fseed);
500 | 		float a111 = randomGrid(ix + 1, iy + 1, iz + 1, fseed);
501 | 
502 | 		// Linear interpolation
503 | 		float x00 = lerp(a000, a100, u);
504 | 		float x10 = lerp(a010, a110, u);
505 | 		float x01 = lerp(a001, a101, u);
506 | 		float x11 = lerp(a011, a111, u);
507 | 
508 | 		float y0 = lerp(x00, x10, v);
509 | 		float y1 = lerp(x01, x11, v);
510 | 
511 | 		return lerp(y0, y1, w);
512 | 	}
513 | 
514 | 	// Linear value noise smoothed with Perlin's fade function
515 | 	__device__ float fadedValue(float3 pos, float scale, int seed)
516 | 	{
517 | 		float fseed = (float)seed;
518 | 
519 | 		int ix = (int)(pos.x * scale);
520 | 		int iy = (int)(pos.y * scale);
521 | 		int iz = (int)(pos.z * scale);
522 | 
523 | 		float u = fade(pos.x - ix);
524 | 		float v = fade(pos.y - iy);
525 | 		float w = fade(pos.z - iz);
526 | 
527 | 		// Corner values
528 | 		float a000 = randomGrid(ix, iy, iz, fseed);
529 | 		float a100 = randomGrid(ix + 1, iy, iz, fseed);
530 | 		float a010 = randomGrid(ix, iy + 1, iz, fseed);
531 | 		float a110 = randomGrid(ix + 1, iy + 1, iz, fseed);
532 | 		float a001 = randomGrid(ix, iy, iz + 1, fseed);
533 | 		float a101 = randomGrid(ix + 1, iy, iz + 1, fseed);
534 | 		float a011 = randomGrid(ix, iy + 1, iz + 1, fseed);
535 | 		float a111 = randomGrid(ix + 1, iy + 1, iz + 1, fseed);
536 | 
537 | 		// Linear interpolation
538 | 		float x00 = lerp(a000, a100, u);
539 | 		float x10 = lerp(a010, a110, u);
540 | 		float x01 = lerp(a001, a101, u);
541 | 		float x11 = lerp(a011, a111, u);
542 | 
543 | 		float y0 = lerp(x00, x10, v);
544 | 		float y1 = lerp(x01, x11, v);
545 | 
546 | 		return lerp(y0, y1, w) / 2.0f * 1.0f;
547 | 	}
548 | 
549 | 	// Tricubic interpolated value noise
550 | 	__device__ float cubicValue(float3 pos, float scale, int seed)
551 | 	{
552 | 		pos.x = pos.x * scale;
553 | 		pos.y = pos.y * scale;
554 | 		pos.z = pos.z * scale;
555 | 
556 | 		int ix = (int)pos.x;
557 | 		int iy = (int)pos.y;
558 | 		int iz = (int)pos.z;
559 | 
560 | 		float u = pos.x - ix;
561 | 		float v = pos.y - iy;
562 | 		float w = pos.z - iz;
563 | 
564 | 		return tricubic(ix, iy, iz, u, v, w);
565 | 	}
566 | 
567 | 	// Perlin gradient noise
568 | 	__device__ float perlinNoise(float3 pos, float scale, int seed)
569 | 	{
570 | 		float fseed = (float)seed;
571 | 
572 | 		pos.x = pos.x * scale;
573 | 		pos.y = pos.y * scale;
574 | 		pos.z = pos.z * scale;
575 | 
576 | 		// zero corner integer position
577 | 		float ix = floorf(pos.x);
578 | 		float iy = floorf(pos.y);
579 | 		float iz = floorf(pos.z);
580 | 
581 | 		// current position within unit cube
582 | 		pos.x -= ix;
583 | 		pos.y -= iy;
584 | 		pos.z -= iz;
585 | 
586 | 		// adjust for fade
587 | 		float u = fade(pos.x);
588 | 		float v = fade(pos.y);
589 | 		float w = fade(pos.z);
590 | 
591 | 		// influence values
592 | 		float i000 = grad(randomIntGrid(ix, iy, iz, fseed), pos.x, pos.y, pos.z);
593 | 		float i100 = grad(randomIntGrid(ix + 1.0f, iy, iz, fseed), pos.x - 1.0f, pos.y, pos.z);
594 | 		float i010 = grad(randomIntGrid(ix, iy + 1.0f, iz, fseed), pos.x, pos.y - 1.0f, pos.z);
595 | 		float i110 = grad(randomIntGrid(ix + 1.0f, iy + 1.0f, iz, fseed), pos.x - 1.0f, pos.y - 1.0f, pos.z);
596 | 		float i001 = grad(randomIntGrid(ix, iy, iz + 1.0f, fseed), pos.x, pos.y, pos.z - 1.0f);
597 | 		float i101 = grad(randomIntGrid(ix + 1.0f, iy, iz + 1.0f, fseed), pos.x - 1.0f, pos.y, pos.z - 1.0f);
598 | 		float i011 = grad(randomIntGrid(ix, iy + 1.0f, iz + 1.0f, fseed), pos.x, pos.y - 1.0f, pos.z - 1.0f);
599 | 		float i111 = grad(randomIntGrid(ix + 1.0f, iy + 1.0f, iz + 1.0f, fseed), pos.x - 1.0f, pos.y - 1.0f, pos.z - 1.0f);
600 | 
601 | 		// interpolation
602 | 		float x00 = lerp(i000, i100, u);
603 | 		float x10 = lerp(i010, i110, u);
604 | 		float x01 = lerp(i001, i101, u);
605 | 		float x11 = lerp(i011, i111, u);
606 | 
607 | 		float y0 = lerp(x00, x10, v);
608 | 		float y1 = lerp(x01, x11, v);
609 | 
610 | 		float avg = lerp(y0, y1, w);
611 | 
612 | 		return avg;
613 | 	}
614 | 
615 | // Derived noise functions
616 | 
617 | 	// Fast function for fBm using perlin noise
618 | 	__device__ float repeaterPerlin(float3 pos, float scale, int seed, int n, float lacunarity, float decay)
619 | 	{
620 | 		float acc = 0.0f;
621 | 		float amp = 1.0f;
622 | 
623 | 		for (int i = 0; i < n; i++)
624 | 		{
625 | 			acc += perlinNoise(make_float3(pos.x * scale, pos.y * scale, pos.z * scale), 1.0f, (i + 38) * 27389482) * amp;
626 | 			scale *= lacunarity;
627 | 			amp *= decay;
628 | 		}
629 | 
630 | 		return acc;
631 | 	}
632 | 
    // Bounded Perlin repeater: multiplies per-octave attenuation factors and returns 0 as soon as the product falls below the threshold
634 |     __device__ float repeaterPerlinBounded(float3 pos, float scale, int seed, int n, float lacunarity, float decay, float threshold)
635 |     {
636 |         float acc = 1.0f;
637 |         float amp = 1.0f;
638 | 
639 |         for (int i = 0; i < n; i++)
640 |         {
641 |             acc *= 1.0f - __saturatef(0.5f + 0.5f * perlinNoise(make_float3(pos.x * scale, pos.y * scale, pos.z * scale), 1.0f, seed ^ ((i + 38) * 27389482))) * amp;
642 | 
643 |             if(acc < threshold)
644 |             {
645 |                 return 0.0f;
646 |             }
647 | 
648 |             scale *= lacunarity;
649 |             amp *= decay;
650 |         }
651 | 
652 |         return acc;
653 |     }
654 | 
655 |     // Fast function for fBm using perlin absolute noise
656 | 	// Originally called "turbulence", this method takes the absolute value of each octave before adding
657 | 	__device__ float repeaterPerlinAbs(float3 pos, float scale, int seed, int n, float lacunarity, float decay)
658 | 	{
659 | 		float acc = 0.0f;
660 | 		float amp = 1.0f;
661 | 
662 | 		for (int i = 0; i < n; i++)
663 | 		{
664 |                         acc += fabsf(perlinNoise(make_float3(pos.x * scale, pos.y * scale, pos.z * scale), 1.0f, seed)) * amp;
665 | 			scale *= lacunarity;
666 | 			amp *= decay;
667 | 		}
668 | 
669 | 		// Map the noise back to the standard expected range [-1, 1]
670 | 		return mapToSigned(acc);
671 | 	}
672 | 
673 | 	// Fast function for fBm using simplex noise
674 | 	__device__ float repeaterSimplex(float3 pos, float scale, int seed, int n, float lacunarity, float decay)
675 | 	{
676 | 		float acc = 0.0f;
677 | 		float amp = 1.0f;
678 | 
679 | 		for (int i = 0; i < n; i++)
680 | 		{
681 |             acc += simplexNoise(make_float3(pos.x, pos.y, pos.z), scale, seed) * amp * 0.35f;
682 | 			scale *= lacunarity;
683 | 			amp *= decay;
684 |             seed = seed ^ ((i + 672381) * 200394);
685 | 		}
686 | 
687 | 		return acc;
688 | 	}
689 | 
690 | 	// Fast function for fBm using simplex absolute noise
691 | 	__device__ float repeaterSimplexAbs(float3 pos, float scale, int seed, int n, float lacunarity, float decay)
692 | 	{
693 | 		float acc = 0.0f;
694 | 		float amp = 1.0f;
695 | 
696 | 		for (int i = 0; i < n; i++)
697 | 		{
698 | 			acc += fabsf(simplexNoise(make_float3(pos.x, pos.y, pos.z), scale, seed)) * amp * 0.35f;
699 | 			scale *= lacunarity;
700 | 			amp *= decay;
701 |             seed = seed ^ ((i + 198273) * 928374);
702 | 		}
703 | 
704 | 		return mapToSigned(acc);
705 | 	}
706 | 
707 | 	// Bounded simplex repeater
708 |     __device__ float repeaterSimplexBounded(float3 pos, float scale, int seed, int n, float lacunarity, float decay, float threshold)
709 |     {
710 |         float acc = 1.0f;
711 |         float amp = 1.0f;
712 | 
713 |         for (int i = 0; i < n; i++)
714 |         {
715 |             float val = __saturatef((simplexNoise(make_float3(pos.x * scale + 32240.7922f, pos.y * scale + 835622.882f, pos.z * scale + 824.371968f), 1.0f, seed) * 0.3f + 0.5f)) * amp;
716 |             acc -= val;
717 | 
718 |             if(acc < threshold)
719 |             {
720 |                 return 0.0f;
721 |             }
722 | 
723 |             scale *= lacunarity;
724 |             amp *= decay;
725 |         }
726 | 
727 |         return acc;
728 |     }
729 | 
730 |     // Generic fBm repeater
731 | 	// NOTE: about 10% slower than the dedicated repeater functions
732 | 	__device__ float repeater(float3 pos, float scale, int seed, int n, float lacunarity, float decay, basisFunction basis)
733 | 	{
734 | 		float acc = 0.0f;
735 | 		float amp = 1.0f;
736 | 
737 | 		for (int i = 0; i < n; i++)
738 | 		{
739 | 			switch (basis)
740 | 			{
741 | 			case(BASIS_CHECKER):
742 | 				acc += checker(make_float3(pos.x * scale + 53872.1923f, pos.y * scale + 58334.4081f, pos.z * scale + 9358.34667f), 1.0f, seed) * amp;
743 | 				break;
744 | 			case(BASIS_DISCRETE):
745 | 				acc += discreteNoise(make_float3(pos.x * scale + 7852.53114f, pos.y * scale + 319739.059f, pos.z * scale + 451336.504f), 1.0f, seed) * amp;
746 | 				break;
747 | 			case(BASIS_LINEARVALUE):
748 | 				acc += linearValue(make_float3(pos.x * scale + 940.748139f, pos.y * scale + 10196.4500f, pos.z * scale + 25650.9789f), 1.0f, seed) * amp;
749 | 				break;
750 | 			case(BASIS_FADEDVALUE):
751 | 				acc += fadedValue(make_float3(pos.x * scale + 7683.26428f, pos.y * scale + 2417.78195f, pos.z * scale + 93889.4897f), 1.0f, seed) * amp;
752 | 				break;
753 | 			case(BASIS_CUBICVALUE):
754 | 				acc += cubicValue(make_float3(pos.x * scale + 6546.80178f, pos.y * scale + 14459.4682f, pos.z * scale + 11616.5811f), 1.0f, seed) * amp;
755 | 				break;
756 | 			case(BASIS_PERLIN):
757 | 				acc += perlinNoise(make_float3(pos.x * scale + 1764.66931f, pos.y * scale + 2593.55017f, pos.z * scale + 4813.24412f), 1.0f, seed) * amp;
758 | 				break;
759 | 			case(BASIS_SIMPLEX):
760 | 				acc += simplexNoise(make_float3(pos.x * scale + 7442.93020f, pos.y * scale + 8341.06698f, pos.z * scale + 66848.7870f), 1.0f, seed) * amp;
761 | 				break;
762 | 			case(BASIS_WORLEY):
763 | 				acc += worleyNoise(make_float3(pos.x * scale + 7619.01285f, pos.y * scale + 57209.0681f, pos.z * scale + 1167.91397f), 1.0f, seed, 0.1f, 4, 4, 1.0f) * amp;
764 | 				break;
765 | 			case(BASIS_SPOTS):
766 | 				acc += spots(make_float3(pos.x * scale + 33836.4116f, pos.y * scale + 2242.51045f, pos.z * scale + 6720.07486f), 1.0f, seed, 0.1f, 0, 4, 1.0f, SHAPE_LINEAR) * amp;
767 | 				break;
768 | 			}
769 | 
770 | 			scale *= lacunarity;
771 | 			amp *= decay;
772 | 		}
773 | 
774 | 		return acc;
775 | 	}
776 | 
777 | 	// Fractal Simplex noise
778 | 	// Unlike the repeater function, which calculates a fixed number of noise octaves, the fractal function continues until
779 | 	// the feature size is smaller than one pixel
780 | 	__device__ float fractalSimplex(float3 pos, float scale, int seed, float du, int n, float lacunarity, float decay)
781 | 	{
782 | 		float acc = 0.0f;
783 | 		float amp = 1.0f;
784 | 
785 | 		float rdu = 1.0f / du;
786 | 
787 | 		for (int i = 0; i < n; i++)
788 | 		{
789 | 			acc += simplexNoise(make_float3(pos.x * scale + 617.437379f, pos.y * scale + 196410.219f, pos.z * scale + 321280.627f), 1.0f, seed * (i + 1)) * amp;
790 | 			scale *= lacunarity;
791 | 			amp *= decay;
792 | 
793 | 			if (scale > rdu)
794 | 				break;
795 | 		}
796 | 
797 | 		return acc;
798 | 	}
799 | 
800 | 	// Generic turbulence function
801 | 	// Uses a first pass of noise to offset the input vectors for the second pass
802 | 	__device__ float turbulence(float3 pos, float scaleIn, float scaleOut, int seed, float strength, basisFunction inFunc, basisFunction outFunc)
803 | 	{
804 | 		switch (inFunc)
805 | 		{
806 | 		case(BASIS_CHECKER):
807 | 			pos.x += checker(pos, scaleIn, seed ^ 0x34ff8885) * strength;
808 | 			pos.y += checker(pos, scaleIn, seed ^ 0x2d03cba3) * strength;
809 | 			pos.z += checker(pos, scaleIn, seed ^ 0x5a76fb1b) * strength;
810 | 			break;
811 | 		case(BASIS_LINEARVALUE):
812 | 			pos.x += linearValue(pos, scaleIn, seed ^ 0x5527fdb8) * strength;
813 | 			pos.y += linearValue(pos, scaleIn, seed ^ 0x42af1a2e) * strength;
814 | 			pos.z += linearValue(pos, scaleIn, seed ^ 0x1482ee8c) * strength;
815 | 			break;
816 | 		case(BASIS_FADEDVALUE):
817 | 			pos.x += fadedValue(pos, scaleIn, seed ^ 0x295590fc) * strength;
818 | 			pos.y += fadedValue(pos, scaleIn, seed ^ 0x30731854) * strength;
819 | 			pos.z += fadedValue(pos, scaleIn, seed ^ 0x73d2ca4c) * strength;
820 | 			break;
821 | 		case(BASIS_CUBICVALUE):
822 | 			pos.x += cubicValue(pos, scaleIn, seed ^ 0x663a1f09) * strength;
823 | 			pos.y += cubicValue(pos, scaleIn, seed ^ 0x429bf56b) * strength;
824 | 			pos.z += cubicValue(pos, scaleIn, seed ^ 0x37fa6fe9) * strength;
825 | 			break;
826 | 		case(BASIS_PERLIN):
827 | 			pos.x += perlinNoise(pos, scaleIn, seed ^ 0x74827384) * strength;
828 | 			pos.y += perlinNoise(pos, scaleIn, seed ^ 0x10938478) * strength;
829 | 			pos.z += perlinNoise(pos, scaleIn, seed ^ 0x62723883) * strength;
830 | 			break;
831 | 		case(BASIS_SIMPLEX):
832 | 			pos.x += simplexNoise(pos, scaleIn, seed ^ 0x47829472) * strength;
833 | 			pos.y += simplexNoise(pos, scaleIn, seed ^ 0x58273829) * strength;
834 | 			pos.z += simplexNoise(pos, scaleIn, seed ^ 0x10294647) * strength;
835 | 			break;
836 | 		case(BASIS_WORLEY):
837 | 			pos.x += worleyNoise(pos, scaleIn, seed ^ 0x1d96f515, 1.0f, 4, 4, 1.0f) * strength;
838 | 			pos.y += worleyNoise(pos, scaleIn, seed ^ 0x4df308f0, 1.0f, 4, 4, 1.0f) * strength;
839 | 			pos.z += worleyNoise(pos, scaleIn, seed ^ 0x2b79442a, 1.0f, 4, 4, 1.0f) * strength;
840 | 			break;
841 | 		}
842 | 
843 | 		switch (outFunc)
844 | 		{
845 | 		case(BASIS_CHECKER):
846 | 			return checker(pos, scaleOut, seed);
847 | 		case(BASIS_LINEARVALUE):
848 | 			return linearValue(pos, scaleOut, seed);
849 | 		case(BASIS_FADEDVALUE):
850 | 			return fadedValue(pos, scaleOut, seed);
851 | 		case(BASIS_CUBICVALUE):
852 | 			return cubicValue(pos, scaleOut, seed);
853 | 		case(BASIS_PERLIN):
854 | 			return perlinNoise(pos, scaleOut, seed);
855 | 		case(BASIS_SIMPLEX):
856 | 			return simplexNoise(pos, scaleIn, seed);
857 | 		case(BASIS_WORLEY):
858 | 			return worleyNoise(pos, scaleIn, seed, 1.0f, 4, 4, 1.0f);
859 | 		}
860 | 
861 | 		return 0.0f;
862 | 	}
863 | 
864 | 	// Turbulence using repeaters for the first and second pass
865 | 	__device__ float repeaterTurbulence(float3 pos, float scaleIn, float scaleOut, int seed, float strength, int n, basisFunction basisIn, basisFunction basisOut)
866 | 	{
867 | 		pos.x += (repeater(make_float3(pos.x, pos.y, pos.z), scaleIn, seed ^ 0x41728394, n, 2.0f, 0.5f, basisIn)) * strength;
868 | 		pos.y += (repeater(make_float3(pos.x, pos.y, pos.z), scaleIn, seed ^ 0x72837263, n, 2.0f, 0.5f, basisIn)) * strength;
869 | 		pos.z += (repeater(make_float3(pos.x, pos.y, pos.z), scaleIn, seed ^ 0x26837363, n, 2.0f, 0.5f, basisIn)) * strength;
870 | 
871 | 		return repeater(pos, scaleOut, seed ^ 0x3f821dab, n, 2.0f, 0.5f, basisOut);
872 | 	}
873 | 
874 | } // namespace
875 | 


--------------------------------------------------------------------------------