#pragma once

namespace Slang
{

/*
This pass will lower all immutable buffer loads into CUDA `__ldg` intrinsic calls
to make sure these loads are performed through the read-only data cache on the GPU
for better performance.
*/

struct IRModule;
class TargetProgram;

void lowerImmutableBufferLoadForCUDA(TargetProgram* targetProgram, IRModule* module);

} // namespace Slang