summaryrefslogtreecommitdiff
path: root/src/random.h
blob: e9d2e759d612163d47527d73614521ef6ea80500 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
#ifndef __RANDOM_H__
#define __RANDOM_H__

#include <curand_kernel.h>

#include "physical_constants.h"

__device__ float
uniform(curandState *s, const float &low, const float &high)
{
    return low + curand_uniform(s)*(high-low);
}

__device__ float3
uniform_sphere(curandState *s)
{
    float theta = uniform(s, 0.0f, 2*PI);
    float u = uniform(s, -1.0f, 1.0f);
    float c = sqrtf(1.0f-u*u);

    return make_float3(c*cosf(theta), c*sinf(theta), u);
}

// Draw a random sample given a cumulative distribution function
// Assumptions: ncdf >= 2, cdf_y[0] is 0.0, and cdf_y[ncdf-1] is 1.0
__device__ float
sample_cdf(curandState *rng, int ncdf, float *cdf_x, float *cdf_y)
{
    float u = curand_uniform(rng);

    // Find u in cdf_y with binary search
    // list must contain at least 2 elements: 0.0 and 1.0
    int lower=0;
    int upper=ncdf-1;
    while(lower < upper-1) {
	int half = (lower+upper) / 2;
	if (u < cdf_y[half])
	    upper = half;
	else
	    lower = half;
    }
  
    float frac = (u - cdf_y[lower]) / (cdf_y[upper] - cdf_y[lower]);
    return cdf_x[lower] * frac + cdf_x[upper] * (1.0f - frac);
}

extern "C"
{

__global__ void
init_rng(int nthreads, curandState *s, unsigned long long seed,
	 unsigned long long offset)
{
    int id = blockIdx.x*blockDim.x + threadIdx.x;

    if (id >= nthreads)
	return;

    curand_init(seed, id, offset, &s[id]);
}

__global__ void
fill_uniform(int nthreads, curandState *s, float *a, float low, float high)
{
    int id = blockIdx.x*blockDim.x + threadIdx.x;

    if (id >= nthreads)
	return;

    a[id] = uniform(&s[id], low, high);

}

__global__ void
fill_uniform_sphere(int nthreads, curandState *s, float3 *a)
{
    int id = blockIdx.x*blockDim.x + threadIdx.x;

    if (id >= nthreads)
	return;

    a[id] = uniform_sphere(&s[id]);
}

} // extern "c"

#endif