blob: adaa58dc86c06face9a01b6d63a10e1a3511f1d4 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
|
#pragma once
namespace Slang
{
// Forward declarations only: this header refers to these types solely through
// pointers, so their full definitions are not needed here.
class TargetProgram;
struct IRModule;

/// Lowers all immutable buffer loads into CUDA `__ldg` intrinsic calls.
///
/// Going through `__ldg` makes sure these loads are performed through the
/// read-only data cache on the GPU, for better performance.
///
/// @param targetProgram NOTE(review): how the pass uses the target program is
///                      not visible from this header; confirm in the
///                      implementation file.
/// @param module        Presumably the IR module whose immutable buffer loads
///                      are rewritten; confirm in the implementation file.
void lowerImmutableBufferLoadForCUDA(TargetProgram* targetProgram, IRModule* module);
} // namespace Slang
|