OWL
OptiX7 Wrapper Library
owl_device.h
Go to the documentation of this file.
1 // ======================================================================== //
2 // Copyright 2019-2020 Ingo Wald //
3 // //
4 // Licensed under the Apache License, Version 2.0 (the "License"); //
5 // you may not use this file except in compliance with the License. //
6 // You may obtain a copy of the License at //
7 // //
8 // http://www.apache.org/licenses/LICENSE-2.0 //
9 // //
10 // Unless required by applicable law or agreed to in writing, software //
11 // distributed under the License is distributed on an "AS IS" BASIS, //
12 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. //
13 // See the License for the specific language governing permissions and //
14 // limitations under the License. //
15 // ======================================================================== //
16 
17 #pragma once
18 
19 #include "owl/common/math/vec.h"
20 #include "owl/common/math/box.h"
21 // the 'actual' optix
22 #include <cuda.h>
23 #include <optix.h>
24 
25 // ==================================================================
26 // actual device-side "API" built-ins.
27 // ==================================================================
28 
29 #ifndef __CUDACC__
30 # error "this file should only ever get included on the device side"
31 #endif
32 
33 namespace owl {
34 
35  using namespace owl::common;
36 
37  inline __device__ vec2i getLaunchIndex()
38  {
39  return (vec2i)optixGetLaunchIndex();
40  }
41 
44  inline __device__ vec2i getLaunchDims()
45  {
46  return (vec2i)optixGetLaunchDimensions();
47  }
48 
53  inline __device__ const void *getProgramDataPointer()
54  {
55  return (const void*)optixGetSbtDataPointer();
56  }
57 
62  template<typename T>
63  inline __device__ const T &getProgramData()
64  {
65  return *(const T*)getProgramDataPointer();
66  }
67 
68 
69  // ==================================================================
70  // general convenience/helper functions - may move to samples
71  // ==================================================================
72  inline __device__ float linear_to_srgb(float x) {
73  if (x <= 0.0031308f) {
74  return 12.92f * x;
75  }
76  return 1.055f * pow(x, 1.f/2.4f) - 0.055f;
77  }
78 
79  inline __device__ uint32_t make_8bit(const float f)
80  {
81  return min(255,max(0,int(f*256.f)));
82  }
83 
84  inline __device__ uint32_t make_rgba(const vec3f color)
85  {
86  return
87  (make_8bit(color.x) << 0) +
88  (make_8bit(color.y) << 8) +
89  (make_8bit(color.z) << 16) +
90  (0xffU << 24);
91  }
92  inline __device__ uint32_t make_rgba(const vec4f color)
93  {
94  return
95  (make_8bit(color.x) << 0) +
96  (make_8bit(color.y) << 8) +
97  (make_8bit(color.z) << 16) +
98  (make_8bit(color.w) << 24);
99  }
100 
101 
102  static __forceinline__ __device__ void* unpackPointer( uint32_t i0, uint32_t i1 )
103  {
104  const uint64_t uptr = static_cast<uint64_t>( i0 ) << 32 | i1;
105  void* ptr = reinterpret_cast<void*>( uptr );
106  return ptr;
107  }
108 
109 
110  static __forceinline__ __device__ void packPointer( void* ptr, uint32_t& i0, uint32_t& i1 )
111  {
112  const uint64_t uptr = reinterpret_cast<uint64_t>( ptr );
113  i0 = uptr >> 32;
114  i1 = uptr & 0x00000000ffffffff;
115  }
116 
117 
118  static __forceinline__ __device__ void *getPRDPointer()
119  {
120  const uint32_t u0 = optixGetPayload_0();
121  const uint32_t u1 = optixGetPayload_1();
122  return unpackPointer(u0, u1);
123  }
124 
125  template<typename T>
126  static __forceinline__ __device__ T &getPRD()
127  { return *(T*)getPRDPointer(); }
128 
129  template<int _rayType=0, int _numRayTypes=1>
130  struct RayT {
131  enum { rayType = _rayType };
132  enum { numRayTypes = _numRayTypes };
133  inline __device__ RayT() {}
134  inline __device__ RayT(const vec3f &origin,
135  const vec3f &direction,
136  float tmin,
137  float tmax)
138  : origin(origin),
139  direction(direction),
140  tmin(tmin),
141  tmax(tmax)
142  {}
143 
144  vec3f origin, direction;
145  float tmin=0.f,tmax=1e30f,time=0.f;
146  };
147  typedef RayT<0,1> Ray;
148 
149 
150  template<typename RayType, typename PRD>
151  inline __device__
152  void traceRay(OptixTraversableHandle traversable,
153  const RayType &ray,
154  PRD &prd,
155  uint32_t rayFlags = 0u)
156  {
157  unsigned int p0 = 0;
158  unsigned int p1 = 0;
159  owl::packPointer(&prd,p0,p1);
160 
161  optixTrace(traversable,
162  (const float3&)ray.origin,
163  (const float3&)ray.direction,
164  ray.tmin,
165  ray.tmax,
166  ray.time,
167  (OptixVisibilityMask)-1,
168  /*rayFlags */rayFlags,
169  /*SBToffset */ray.rayType,
170  /*SBTstride */ray.numRayTypes,
171  /*missSBTIndex */ray.rayType,
172  p0,
173  p1);
174  }
175 
176  template<typename PRD>
177  inline __device__
178  void trace(OptixTraversableHandle traversable,
179  const Ray &ray,
180  int numRayTypes,
181  PRD &prd,
182  int sbtOffset = 0)
183  {
184  unsigned int p0 = 0;
185  unsigned int p1 = 0;
186  owl::packPointer(&prd,p0,p1);
187 
188  optixTrace(traversable,
189  (const float3&)ray.origin,
190  (const float3&)ray.direction,
191  ray.tmin,
192  ray.tmax,
193  ray.time,
194  (OptixVisibilityMask)-1,
195  /*rayFlags */0u,
196  /*SBToffset */ray.rayType + numRayTypes*sbtOffset,
197  /*SBTstride */numRayTypes,
198  /*missSBTIndex */ray.rayType,
199  p0,
200  p1);
201  }
202 
203 } // ::owl
204 
205 #define OPTIX_RAYGEN_PROGRAM(programName) \
206  extern "C" __global__ \
207  void __raygen__##programName
208 
209 #define OPTIX_CLOSEST_HIT_PROGRAM(programName) \
210  extern "C" __global__ \
211  void __closesthit__##programName
212 
213 #define OPTIX_ANY_HIT_PROGRAM(programName) \
214  extern "C" __global__ \
215  void __anyhit__##programName
216 
217 #define OPTIX_INTERSECT_PROGRAM(programName) \
218  extern "C" __global__ \
219  void __intersection__##programName
220 
221 #define OPTIX_MISS_PROGRAM(programName) \
222  extern "C" __global__ \
223  void __miss__##programName
224 
225 
226 
227 /* defines the wrapper stuff to actually launch all the bounds
228  programs from the host - todo: move to deviceAPI.h once working */
229 #define OPTIX_BOUNDS_PROGRAM(progName) \
230  /* fwd decl for the kernel func to call */ \
231  inline __device__ \
232  void __boundsFunc__##progName(const void *geomData, \
233  box3f &bounds, \
234  const int32_t primID); \
235  \
236  /* the '__global__' kernel we can get a function handle on */ \
237  extern "C" __global__ \
238  void __boundsFuncKernel__##progName(const void *geomData, \
239  box3f *const boundsArray, \
240  const uint32_t numPrims) \
241  { \
242  uint32_t blockIndex \
243  = blockIdx.x \
244  + blockIdx.y * gridDim.x \
245  + blockIdx.z * gridDim.x * gridDim.y; \
246  uint32_t primID \
247  = threadIdx.x + blockDim.x*threadIdx.y \
248  + blockDim.x*blockDim.y*blockIndex; \
249  if (primID < numPrims) { \
250  __boundsFunc__##progName(geomData,boundsArray[primID],primID); \
251  } \
252  } \
253  \
254  /* now the actual device code that the user is writing: */ \
255  inline __device__ void __boundsFunc__##progName \
256  /* program args and body supplied by user ... */
257 
258 
owl::getProgramData
__device__ const T & getProgramData()
Definition: owl_device.h:63
owl::unpackPointer
static __forceinline__ __device__ void * unpackPointer(uint32_t i0, uint32_t i1)
Definition: owl_device.h:102
optix.h
owl::traceRay
__device__ void traceRay(OptixTraversableHandle traversable, const RayType &ray, PRD &prd, uint32_t rayFlags=0u)
Definition: owl_device.h:152
owl::make_rgba
__device__ uint32_t make_rgba(const vec3f color)
Definition: owl_device.h:84
owl::RayT::tmax
float tmax
Definition: owl_device.h:145
owl::packPointer
static __forceinline__ __device__ void packPointer(void *ptr, uint32_t &i0, uint32_t &i1)
Definition: owl_device.h:110
cuda.h
owl::getPRDPointer
static __forceinline__ __device__ void * getPRDPointer()
Definition: owl_device.h:118
owl::RayT::RayT
__device__ RayT()
Definition: owl_device.h:133
box.h
owl::RayT
Definition: owl_device.h:130
owl::RayT::time
float time
Definition: owl_device.h:145
owl::RayT::direction
vec3f direction
Definition: owl_device.h:144
owl::getLaunchDims
__device__ vec2i getLaunchDims()
Definition: owl_device.h:44
owl::linear_to_srgb
__device__ float linear_to_srgb(float x)
Definition: owl_device.h:72
owl::Ray
RayT< 0, 1 > Ray
Definition: owl_device.h:147
owl::common
Definition: array2D.h:22
owl::RayT::RayT
__device__ RayT(const vec3f &origin, const vec3f &direction, float tmin, float tmax)
Definition: owl_device.h:134
owl::trace
__device__ void trace(OptixTraversableHandle traversable, const Ray &ray, int numRayTypes, PRD &prd, int sbtOffset=0)
Definition: owl_device.h:178
owl::make_8bit
__device__ uint32_t make_8bit(const float f)
Definition: owl_device.h:79
vec.h
owl::RayT::origin
vec3f origin
Definition: owl_device.h:144
owl
Definition: APIContext.cpp:36
owl::getLaunchIndex
__device__ vec2i getLaunchIndex()
Definition: owl_device.h:37
owl::getProgramDataPointer
__device__ const void * getProgramDataPointer()
Definition: owl_device.h:53
owl::getPRD
static __forceinline__ __device__ T & getPRD()
Definition: owl_device.h:126
owl::RayT::rayType
@ rayType
Definition: owl_device.h:131
owl::RayT::tmin
float tmin
Definition: owl_device.h:145