Blender V4.3
kernel/device/oneapi/kernel.cpp
Go to the documentation of this file.
1/* SPDX-FileCopyrightText: 2021-2022 Intel Corporation
2 *
3 * SPDX-License-Identifier: Apache-2.0 */
4
5#ifdef WITH_ONEAPI
6
7# include "kernel.h"
8# include <iostream>
9# include <map>
10# include <set>
11
12/* <algorithm> is needed until included upstream in sycl/detail/property_list_base.hpp */
13# include <algorithm>
14# include <sycl/sycl.hpp>
15
19
21
22# include "device/kernel.cpp"
23
24static OneAPIErrorCallback s_error_cb = nullptr;
25static void *s_error_user_ptr = nullptr;
26
27# ifdef WITH_EMBREE_GPU
28static const RTCFeatureFlags CYCLES_ONEAPI_EMBREE_BASIC_FEATURES = (const RTCFeatureFlags)(
29 RTC_FEATURE_FLAG_TRIANGLE | RTC_FEATURE_FLAG_INSTANCE |
30 RTC_FEATURE_FLAG_FILTER_FUNCTION_IN_ARGUMENTS | RTC_FEATURE_FLAG_POINT |
31 RTC_FEATURE_FLAG_MOTION_BLUR);
32static const RTCFeatureFlags CYCLES_ONEAPI_EMBREE_ALL_FEATURES = (const RTCFeatureFlags)(
33 CYCLES_ONEAPI_EMBREE_BASIC_FEATURES | RTC_FEATURE_FLAG_ROUND_CATMULL_ROM_CURVE |
34 RTC_FEATURE_FLAG_FLAT_CATMULL_ROM_CURVE);
35# endif
36
37void oneapi_set_error_cb(OneAPIErrorCallback cb, void *user_ptr)
38{
39 s_error_cb = cb;
40 s_error_user_ptr = user_ptr;
41}
42
/* Return a size value for the given kernel, or 0 for any kernel without a dedicated case.
 * NOTE(review): the `case` labels and their return values are not visible in this listing
 * (only the `default` branch is), so the non-zero values cannot be documented here. */
43size_t oneapi_suggested_gpu_kernel_size(const DeviceKernel kernel)
44{
45 /* These defines are available only to the device code, so making this function
46 * seems to be the most reasonable way to provide access to them for the host code. */
47 switch (kernel) {
56
61
65
68
69 default:
70 return (size_t)0;
71 }
72}
73
74/* NOTE(@nsirgien): Execution of this simple kernel will check basic functionality like
75 * memory allocations, memory transfers and execution of kernel with USM memory. */
76bool oneapi_run_test_kernel(SyclQueue *queue_)
77{
78 assert(queue_);
79 sycl::queue *queue = reinterpret_cast<sycl::queue *>(queue_);
80 const size_t N = 8;
81 const size_t memory_byte_size = sizeof(int) * N;
82
83 bool is_computation_correct = true;
84 try {
85 int *A_host = (int *)sycl::aligned_alloc_host(16, memory_byte_size, *queue);
86
87 for (size_t i = (size_t)0; i < N; i++) {
88 A_host[i] = rand() % 32;
89 }
90
91 int *A_device = (int *)sycl::malloc_device(memory_byte_size, *queue);
92 int *B_device = (int *)sycl::malloc_device(memory_byte_size, *queue);
93
94 queue->memcpy(A_device, A_host, memory_byte_size);
95 queue->wait_and_throw();
96
97 queue->submit([&](sycl::handler &cgh) {
98 cgh.parallel_for(N, [=](sycl::id<1> idx) { B_device[idx] = A_device[idx] + idx.get(0); });
99 });
100 queue->wait_and_throw();
101
102 int *B_host = (int *)sycl::aligned_alloc_host(16, memory_byte_size, *queue);
103
104 queue->memcpy(B_host, B_device, memory_byte_size);
105 queue->wait_and_throw();
106
107 for (size_t i = (size_t)0; i < N; i++) {
108 const int expected_result = i + A_host[i];
109 if (B_host[i] != expected_result) {
110 is_computation_correct = false;
111 if (s_error_cb) {
112 s_error_cb(("Incorrect result in test kernel execution - expected " +
113 std::to_string(expected_result) + ", got " + std::to_string(B_host[i]))
114 .c_str(),
115 s_error_user_ptr);
116 }
117 }
118 }
119
120 sycl::free(A_host, *queue);
121 sycl::free(B_host, *queue);
122 sycl::free(A_device, *queue);
123 sycl::free(B_device, *queue);
124 queue->wait_and_throw();
125 }
126 catch (sycl::exception const &e) {
127 if (s_error_cb) {
128 s_error_cb(e.what(), s_error_user_ptr);
129 }
130 return false;
131 }
132
133 return is_computation_correct;
134}
135
136bool oneapi_zero_memory_on_device(SyclQueue *queue_, void *device_pointer, size_t num_bytes)
137{
138 assert(queue_);
139 sycl::queue *queue = reinterpret_cast<sycl::queue *>(queue_);
140 try {
141 queue->memset(device_pointer, 0, num_bytes);
142 queue->wait_and_throw();
143 return true;
144 }
145 catch (sycl::exception const &e) {
146 if (s_error_cb) {
147 s_error_cb(e.what(), s_error_user_ptr);
148 }
149 return false;
150 }
151}
152
/* Decide from a kernel's name whether it has to be loaded for the given feature mask.
 * Names that do not contain "oneapi_kernel_" are rejected outright. After that, each of the
 * feature checks below (node ray-trace, MNEE, volume, path tracing / baking) can reject the
 * kernel when its feature bits are not set in `kernel_features` and a name test matches.
 * Returns true when no check rejects the kernel.
 * NOTE(review): the name-test halves of these conditions are missing from this listing, so
 * the exact kernels tied to each feature cannot be stated here. */
153bool oneapi_kernel_is_required_for_features(const std::string &kernel_name,
154 const uint kernel_features)
155{
156 /* Skip all non-Cycles kernels */
157 if (kernel_name.find("oneapi_kernel_") == std::string::npos) {
158 return false;
159 }
160
161 if ((kernel_features & KERNEL_FEATURE_NODE_RAYTRACE) == 0 &&
163 std::string::npos)
164 {
165 return false;
166 }
167
168 if ((kernel_features & KERNEL_FEATURE_MNEE) == 0 &&
170 std::string::npos)
171 {
172 return false;
173 }
174
175 if ((kernel_features & KERNEL_FEATURE_VOLUME) == 0 &&
177 std::string::npos)
178 {
179 return false;
180 }
181
182 if (((kernel_features & (KERNEL_FEATURE_PATH_TRACING | KERNEL_FEATURE_BAKING)) == 0) &&
184 std::string::npos) ||
186 std::string::npos) ||
188 std::string::npos) ||
189 (kernel_name.find(device_kernel_as_string(
191 {
192 return false;
193 }
194
195 return true;
196}
197
/* Tell whether the named kernel may be used together with hardware ray-tracing.
 * When `RTC_VERSION` is not defined or is at least 40100 the answer is always true. For
 * older versions the result is computed from name tests on `kernel_name`.
 * NOTE(review): most of that older-version expression is missing from this listing. */
198bool oneapi_kernel_is_compatible_with_hardware_raytracing(const std::string &kernel_name)
199{
200 /* MNEE and Ray-trace kernels work correctly with Hardware Ray-tracing starting with Embree 4.1.
201 */
202# if defined(RTC_VERSION) && RTC_VERSION < 40100
204 std::string::npos) &&
205 (kernel_name.find(device_kernel_as_string(
207# else
208 return true;
209# endif
210}
211
212bool oneapi_kernel_has_intersections(const std::string &kernel_name)
213{
214 for (int i = 0; i < (int)DEVICE_KERNEL_NUM; i++) {
215 DeviceKernel kernel = (DeviceKernel)i;
216 if (device_kernel_has_intersection(kernel)) {
217 if (kernel_name.find(device_kernel_as_string(kernel)) != std::string::npos) {
218 return true;
219 }
220 }
221 }
222 return false;
223}
224
225bool oneapi_load_kernels(SyclQueue *queue_,
226 const uint kernel_features,
227 bool use_hardware_raytracing)
228{
229 assert(queue_);
230 sycl::queue *queue = reinterpret_cast<sycl::queue *>(queue_);
231
232# ifdef WITH_EMBREE_GPU
233 /* For best performance, we always JIT compile the kernels that are using Embree. */
234 if (use_hardware_raytracing) {
235 try {
236 sycl::kernel_bundle<sycl::bundle_state::input> all_kernels_bundle =
237 sycl::get_kernel_bundle<sycl::bundle_state::input>(queue->get_context(),
238 {queue->get_device()});
239
240 for (const sycl::kernel_id &kernel_id : all_kernels_bundle.get_kernel_ids()) {
241 const std::string &kernel_name = kernel_id.get_name();
242
243 if (!oneapi_kernel_is_required_for_features(kernel_name, kernel_features) ||
244 !(oneapi_kernel_has_intersections(kernel_name) &&
245 oneapi_kernel_is_compatible_with_hardware_raytracing(kernel_name)))
246 {
247 continue;
248 }
249
250 sycl::kernel_bundle<sycl::bundle_state::input> one_kernel_bundle_input =
251 sycl::get_kernel_bundle<sycl::bundle_state::input>(queue->get_context(), {kernel_id});
252
253 /* Hair requires embree curves support. */
254 if (kernel_features & KERNEL_FEATURE_HAIR) {
255 one_kernel_bundle_input
256 .set_specialization_constant<ONEAPIKernelContext::oneapi_embree_features>(
257 CYCLES_ONEAPI_EMBREE_ALL_FEATURES);
258 sycl::build(one_kernel_bundle_input);
259 }
260 else {
261 one_kernel_bundle_input
262 .set_specialization_constant<ONEAPIKernelContext::oneapi_embree_features>(
263 CYCLES_ONEAPI_EMBREE_BASIC_FEATURES);
264 sycl::build(one_kernel_bundle_input);
265 }
266 }
267 }
268 catch (sycl::exception const &e) {
269 if (s_error_cb) {
270 s_error_cb(e.what(), s_error_user_ptr);
271 }
272 return false;
273 }
274 }
275# endif
276
277 try {
278 sycl::kernel_bundle<sycl::bundle_state::input> all_kernels_bundle =
279 sycl::get_kernel_bundle<sycl::bundle_state::input>(queue->get_context(),
280 {queue->get_device()});
281
282 for (const sycl::kernel_id &kernel_id : all_kernels_bundle.get_kernel_ids()) {
283 const std::string &kernel_name = kernel_id.get_name();
284
285 /* In case HWRT is on, compilation of kernels using Embree is already handled in previous
286 * block. */
287 if (!oneapi_kernel_is_required_for_features(kernel_name, kernel_features) ||
288 (use_hardware_raytracing && oneapi_kernel_has_intersections(kernel_name) &&
289 oneapi_kernel_is_compatible_with_hardware_raytracing(kernel_name)))
290 {
291 continue;
292 }
293
294# ifdef WITH_EMBREE_GPU
295 if (oneapi_kernel_has_intersections(kernel_name)) {
296 sycl::kernel_bundle<sycl::bundle_state::input> one_kernel_bundle_input =
297 sycl::get_kernel_bundle<sycl::bundle_state::input>(queue->get_context(), {kernel_id});
298 one_kernel_bundle_input
299 .set_specialization_constant<ONEAPIKernelContext::oneapi_embree_features>(
300 RTC_FEATURE_FLAG_NONE);
301 sycl::build(one_kernel_bundle_input);
302 continue;
303 }
304# endif
305 /* This call will ensure that AoT or cached JIT binaries are available
306 * for execution. It will trigger compilation if it is not already the case. */
307 (void)sycl::get_kernel_bundle<sycl::bundle_state::executable>(queue->get_context(),
308 {kernel_id});
309 }
310 }
311 catch (sycl::exception const &e) {
312 if (s_error_cb) {
313 s_error_cb(e.what(), s_error_user_ptr);
314 }
315 return false;
316 }
317 return true;
318}
319
/* Submit one command group for the requested device kernel to the SYCL queue stored in
 * `kernel_context->queue`.
 *
 * `kernel` is cast to `DeviceKernel` and selects, through the switch below, which
 * `oneapi_kernel_*` entry point receives `kg`, the handler, `global_size`, `local_size` and
 * `args`. The two sort passes additionally get a local accessor of `max_shaders` ints, where
 * `max_shaders` is read from `kernel_context->scene_max_shaders`.
 *
 * With `WITH_EMBREE_GPU`, kernels for which `device_kernel_has_intersection()` is true get
 * the Embree feature specialization constant set: none without hardware ray-tracing,
 * otherwise the basic set, or the full set when `KERNEL_FEATURE_HAIR` is requested.
 *
 * Returns false when the queue is null. No wait on the queue is visible in this function.
 * NOTE(review): the `case` labels of the switch are missing from this listing. */
320bool oneapi_enqueue_kernel(KernelContext *kernel_context,
321 int kernel,
322 size_t global_size,
323 size_t local_size,
324 const uint kernel_features,
325 bool use_hardware_raytracing,
326 void **args)
327{
328 bool success = true;
329 ::DeviceKernel device_kernel = (::DeviceKernel)kernel;
330 KernelGlobalsGPU *kg = (KernelGlobalsGPU *)kernel_context->kernel_globals;
331 sycl::queue *queue = reinterpret_cast<sycl::queue *>(kernel_context->queue);
332 assert(queue);
333 if (!queue) {
334 return false;
335 }
336
337 /* Let the compiler throw an error if there are any kernels missing in this implementation. */
338# if defined(_WIN32)
339# pragma warning(error : 4062)
340# elif defined(__GNUC__)
341# pragma GCC diagnostic push
342# pragma GCC diagnostic error "-Wswitch"
343# endif
344
345 int max_shaders = 0;
346
347 if (device_kernel == DEVICE_KERNEL_INTEGRATOR_SORT_BUCKET_PASS ||
349 {
350 max_shaders = (kernel_context->scene_max_shaders);
351 }
352
353 try {
354 queue->submit([&](sycl::handler &cgh) {
355# ifdef WITH_EMBREE_GPU
356 /* Spec says it has no effect if the called kernel doesn't support the below specialization
357 * constant but it can still trigger a recompilation, so we set it only if needed. */
358 if (device_kernel_has_intersection(device_kernel)) {
359 const RTCFeatureFlags used_embree_features = !use_hardware_raytracing ?
360 RTC_FEATURE_FLAG_NONE :
361 !(kernel_features & KERNEL_FEATURE_HAIR) ?
362 CYCLES_ONEAPI_EMBREE_BASIC_FEATURES :
363 CYCLES_ONEAPI_EMBREE_ALL_FEATURES;
364 cgh.set_specialization_constant<ONEAPIKernelContext::oneapi_embree_features>(
365 used_embree_features);
366 }
367# else
368 (void)kernel_features;
369# endif
370 switch (device_kernel) {
372 oneapi_call(kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_reset);
373 break;
374 }
376 oneapi_call(
377 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_init_from_camera);
378 break;
379 }
381 oneapi_call(
382 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_init_from_bake);
383 break;
384 }
386 oneapi_call(
387 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_intersect_closest);
388 break;
389 }
391 oneapi_call(
392 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_intersect_shadow);
393 break;
394 }
396 oneapi_call(kg,
397 cgh,
398 global_size,
399 local_size,
400 args,
401 oneapi_kernel_integrator_intersect_subsurface);
402 break;
403 }
405 oneapi_call(kg,
406 cgh,
407 global_size,
408 local_size,
409 args,
410 oneapi_kernel_integrator_intersect_volume_stack);
411 break;
412 }
414 oneapi_call(kg,
415 cgh,
416 global_size,
417 local_size,
418 args,
419 oneapi_kernel_integrator_intersect_dedicated_light);
420 break;
421 }
423 oneapi_call(
424 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_shade_background);
425 break;
426 }
428 oneapi_call(
429 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_shade_light);
430 break;
431 }
433 oneapi_call(
434 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_shade_shadow);
435 break;
436 }
438 oneapi_call(
439 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_shade_surface);
440 break;
441 }
443 oneapi_call(kg,
444 cgh,
445 global_size,
446 local_size,
447 args,
448 oneapi_kernel_integrator_shade_surface_raytrace);
449 break;
450 }
452 oneapi_call(
453 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_shade_surface_mnee);
454 break;
455 }
457 oneapi_call(
458 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_shade_volume);
459 break;
460 }
462 oneapi_call(kg,
463 cgh,
464 global_size,
465 local_size,
466 args,
467 oneapi_kernel_integrator_shade_dedicated_light);
468 break;
469 }
471 oneapi_call(
472 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_queued_paths_array);
473 break;
474 }
476 oneapi_call(kg,
477 cgh,
478 global_size,
479 local_size,
480 args,
481 oneapi_kernel_integrator_queued_shadow_paths_array);
482 break;
483 }
485 oneapi_call(
486 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_active_paths_array);
487 break;
488 }
490 oneapi_call(kg,
491 cgh,
492 global_size,
493 local_size,
494 args,
495 oneapi_kernel_integrator_terminated_paths_array);
496 break;
497 }
499 oneapi_call(kg,
500 cgh,
501 global_size,
502 local_size,
503 args,
504 oneapi_kernel_integrator_terminated_shadow_paths_array);
505 break;
506 }
508 oneapi_call(
509 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_sorted_paths_array);
510 break;
511 }
513 sycl::local_accessor<int> local_mem(max_shaders, cgh);
514 oneapi_kernel_integrator_sort_bucket_pass(kg,
515 global_size,
516 local_size,
517 cgh,
518 *(int *)(args[0]),
519 *(int *)(args[1]),
520 *(int *)(args[2]),
521 *(int **)(args[3]),
522 *(int *)(args[4]),
523 local_mem);
524 break;
525 }
527 sycl::local_accessor<int> local_mem(max_shaders, cgh);
528 oneapi_kernel_integrator_sort_write_pass(kg,
529 global_size,
530 local_size,
531 cgh,
532 *(int *)(args[0]),
533 *(int *)(args[1]),
534 *(int *)(args[2]),
535 *(int **)(args[3]),
536 *(int *)(args[4]),
537 local_mem);
538 break;
539 }
541 oneapi_call(kg,
542 cgh,
543 global_size,
544 local_size,
545 args,
546 oneapi_kernel_integrator_compact_paths_array);
547 break;
548 }
550 oneapi_call(kg,
551 cgh,
552 global_size,
553 local_size,
554 args,
555 oneapi_kernel_integrator_compact_shadow_paths_array);
556 break;
557 }
559 oneapi_call(kg,
560 cgh,
561 global_size,
562 local_size,
563 args,
564 oneapi_kernel_adaptive_sampling_convergence_check);
565 break;
566 }
568 oneapi_call(
569 kg, cgh, global_size, local_size, args, oneapi_kernel_adaptive_sampling_filter_x);
570 break;
571 }
573 oneapi_call(
574 kg, cgh, global_size, local_size, args, oneapi_kernel_adaptive_sampling_filter_y);
575 break;
576 }
578 oneapi_call(kg, cgh, global_size, local_size, args, oneapi_kernel_shader_eval_displace);
579 break;
580 }
582 oneapi_call(
583 kg, cgh, global_size, local_size, args, oneapi_kernel_shader_eval_background);
584 break;
585 }
587 oneapi_call(kg,
588 cgh,
589 global_size,
590 local_size,
591 args,
592 oneapi_kernel_shader_eval_curve_shadow_transparency);
593 break;
594 }
596 oneapi_call(kg, cgh, global_size, local_size, args, oneapi_kernel_prefix_sum);
597 break;
598 }
599
600 /* clang-format off */
601 # define DEVICE_KERNEL_FILM_CONVERT_PARTIAL(VARIANT, variant) \
602 case DEVICE_KERNEL_FILM_CONVERT_##VARIANT: { \
603 oneapi_call(kg, cgh, \
604 global_size, \
605 local_size, \
606 args, \
607 oneapi_kernel_film_convert_##variant); \
608 break; \
609 }
610
611# define DEVICE_KERNEL_FILM_CONVERT(variant, VARIANT) \
612 DEVICE_KERNEL_FILM_CONVERT_PARTIAL(VARIANT, variant) \
613 DEVICE_KERNEL_FILM_CONVERT_PARTIAL(VARIANT##_HALF_RGBA, variant##_half_rgba)
614
615 DEVICE_KERNEL_FILM_CONVERT(depth, DEPTH);
616 DEVICE_KERNEL_FILM_CONVERT(mist, MIST);
617 DEVICE_KERNEL_FILM_CONVERT(sample_count, SAMPLE_COUNT);
618 DEVICE_KERNEL_FILM_CONVERT(float, FLOAT);
619 DEVICE_KERNEL_FILM_CONVERT(light_path, LIGHT_PATH);
620 DEVICE_KERNEL_FILM_CONVERT(float3, FLOAT3);
621 DEVICE_KERNEL_FILM_CONVERT(motion, MOTION);
622 DEVICE_KERNEL_FILM_CONVERT(cryptomatte, CRYPTOMATTE);
623 DEVICE_KERNEL_FILM_CONVERT(shadow_catcher, SHADOW_CATCHER);
624 DEVICE_KERNEL_FILM_CONVERT(shadow_catcher_matte_with_shadow,
625 SHADOW_CATCHER_MATTE_WITH_SHADOW);
626 DEVICE_KERNEL_FILM_CONVERT(combined, COMBINED);
627 DEVICE_KERNEL_FILM_CONVERT(float4, FLOAT4);
628
629# undef DEVICE_KERNEL_FILM_CONVERT
630# undef DEVICE_KERNEL_FILM_CONVERT_PARTIAL
631 /* clang-format on */
632
634 oneapi_call(
635 kg, cgh, global_size, local_size, args, oneapi_kernel_filter_guiding_preprocess);
636 break;
637 }
639 oneapi_call(kg,
640 cgh,
641 global_size,
642 local_size,
643 args,
644 oneapi_kernel_filter_guiding_set_fake_albedo);
645 break;
646 }
648 oneapi_call(
649 kg, cgh, global_size, local_size, args, oneapi_kernel_filter_color_preprocess);
650 break;
651 }
653 oneapi_call(
654 kg, cgh, global_size, local_size, args, oneapi_kernel_filter_color_postprocess);
655 break;
656 }
658 oneapi_call(
659 kg, cgh, global_size, local_size, args, oneapi_kernel_cryptomatte_postprocess);
660 break;
661 }
663 oneapi_call(
664 kg, cgh, global_size, local_size, args, oneapi_kernel_integrator_compact_states);
665 break;
666 }
668 oneapi_call(kg,
669 cgh,
670 global_size,
671 local_size,
672 args,
673 oneapi_kernel_integrator_compact_shadow_states);
674 break;
675 }
677 oneapi_call(kg,
678 cgh,
679 global_size,
680 local_size,
681 args,
682 oneapi_kernel_integrator_shadow_catcher_count_possible_splits);
683 break;
684 }
685 /* Unsupported kernels */
688 kernel_assert(0);
689 break;
690 }
691 });
692 }
/* NOTE(review): `success` is cleared only inside the `if (s_error_cb)` branch below, so a
 * SYCL exception raised while no error callback is registered still makes this function
 * return true. The other functions in this file return false regardless of the callback;
 * confirm whether the assignment should sit outside of the `if`. */
693 catch (sycl::exception const &e) {
694 if (s_error_cb) {
695 s_error_cb(e.what(), s_error_user_ptr);
696 success = false;
697 }
698 }
699
700# if defined(_WIN32)
701# pragma warning(default : 4062)
702# elif defined(__GNUC__)
703# pragma GCC diagnostic pop
704# endif
705 return success;
706}
707
708#endif /* WITH_ONEAPI */
unsigned int uint
ATTR_WARN_UNUSED_RESULT const BMVert const BMEdge * e
#define kernel_assert(cond)
bool device_kernel_has_intersection(DeviceKernel kernel)
const char * device_kernel_as_string(DeviceKernel kernel)
draw_view push_constant(Type::INT, "radiance_src") .push_constant(Type capture_info_buf storage_buf(1, Qualifier::READ, "ObjectBounds", "bounds_buf[]") .push_constant(Type draw_view int
#define KERNEL_FEATURE_VOLUME
#define KERNEL_FEATURE_PATH_TRACING
#define KERNEL_FEATURE_HAIR
#define KERNEL_FEATURE_NODE_RAYTRACE
#define KERNEL_FEATURE_BAKING
#define KERNEL_FEATURE_MNEE
DeviceKernel
@ DEVICE_KERNEL_ADAPTIVE_SAMPLING_CONVERGENCE_CHECK
@ DEVICE_KERNEL_INTEGRATOR_RESET
@ DEVICE_KERNEL_INTEGRATOR_QUEUED_PATHS_ARRAY
@ DEVICE_KERNEL_INTEGRATOR_SHADE_LIGHT
@ DEVICE_KERNEL_INTEGRATOR_SHADE_DEDICATED_LIGHT
@ DEVICE_KERNEL_FILTER_COLOR_PREPROCESS
@ DEVICE_KERNEL_INTEGRATOR_SHADE_SURFACE
@ DEVICE_KERNEL_INTEGRATOR_SORT_WRITE_PASS
@ DEVICE_KERNEL_SHADER_EVAL_DISPLACE
@ DEVICE_KERNEL_INTEGRATOR_SHADOW_CATCHER_COUNT_POSSIBLE_SPLITS
@ DEVICE_KERNEL_INTEGRATOR_INTERSECT_SUBSURFACE
@ DEVICE_KERNEL_INTEGRATOR_QUEUED_SHADOW_PATHS_ARRAY
@ DEVICE_KERNEL_FILTER_GUIDING_SET_FAKE_ALBEDO
@ DEVICE_KERNEL_FILTER_COLOR_POSTPROCESS
@ DEVICE_KERNEL_INTEGRATOR_SHADE_SHADOW
@ DEVICE_KERNEL_INTEGRATOR_TERMINATED_PATHS_ARRAY
@ DEVICE_KERNEL_INTEGRATOR_INTERSECT_VOLUME_STACK
@ DEVICE_KERNEL_SHADER_EVAL_BACKGROUND
@ DEVICE_KERNEL_INTEGRATOR_SORTED_PATHS_ARRAY
@ DEVICE_KERNEL_INTEGRATOR_COMPACT_SHADOW_PATHS_ARRAY
@ DEVICE_KERNEL_INTEGRATOR_COMPACT_SHADOW_STATES
@ DEVICE_KERNEL_INTEGRATOR_SHADE_SURFACE_RAYTRACE
@ DEVICE_KERNEL_INTEGRATOR_SORT_BUCKET_PASS
@ DEVICE_KERNEL_INTEGRATOR_INTERSECT_DEDICATED_LIGHT
@ DEVICE_KERNEL_FILTER_GUIDING_PREPROCESS
@ DEVICE_KERNEL_INTEGRATOR_COMPACT_STATES
@ DEVICE_KERNEL_INTEGRATOR_SHADE_SURFACE_MNEE
@ DEVICE_KERNEL_INTEGRATOR_TERMINATED_SHADOW_PATHS_ARRAY
@ DEVICE_KERNEL_INTEGRATOR_MEGAKERNEL
@ DEVICE_KERNEL_NUM
@ DEVICE_KERNEL_INTEGRATOR_ACTIVE_PATHS_ARRAY
@ DEVICE_KERNEL_INTEGRATOR_INIT_FROM_CAMERA
@ DEVICE_KERNEL_ADAPTIVE_SAMPLING_CONVERGENCE_FILTER_Y
@ DEVICE_KERNEL_ADAPTIVE_SAMPLING_CONVERGENCE_FILTER_X
@ DEVICE_KERNEL_CRYPTOMATTE_POSTPROCESS
@ DEVICE_KERNEL_INTEGRATOR_COMPACT_PATHS_ARRAY
@ DEVICE_KERNEL_INTEGRATOR_INIT_FROM_BAKE
@ DEVICE_KERNEL_SHADER_EVAL_CURVE_SHADOW_TRANSPARENCY
@ DEVICE_KERNEL_INTEGRATOR_SHADE_VOLUME
@ DEVICE_KERNEL_INTEGRATOR_INTERSECT_SHADOW
@ DEVICE_KERNEL_INTEGRATOR_INTERSECT_CLOSEST
@ DEVICE_KERNEL_INTEGRATOR_SHADE_BACKGROUND
@ DEVICE_KERNEL_PREFIX_SUM
#define N
#define GPU_PARALLEL_ACTIVE_INDEX_DEFAULT_BLOCK_SIZE
#define GPU_PARALLEL_PREFIX_SUM_DEFAULT_BLOCK_SIZE
#define GPU_PARALLEL_SORTED_INDEX_DEFAULT_BLOCK_SIZE
#define GPU_PARALLEL_SORT_BLOCK_SIZE
@ FLOAT4
@ FLOAT3
@ FLOAT