summaryrefslogtreecommitdiff
path: root/tools/gfx-unit-test/shared-buffers-tests.cpp
blob: ccd223fc07421607f671f41726bf20a5bf3d3736 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
#include "tools/unit-test/slang-unit-test.h"

#include "slang-gfx.h"
#include "gfx-test-util.h"
#include "tools/gfx-util/shader-cursor.h"
#include "source/core/slang-basic.h"

using namespace gfx;

namespace gfx_test
{
    // Verifies that a buffer created on one device can be shared with, and used by, another device.
    //
    // Steps, in order:
    //   1. Create a buffer with `isShared = true` on `srcDevice`, initialized with {0, 1, 2, 3}.
    //   2. Get its shared handle and create a second buffer from that handle on `dstDevice`.
    //   3. Run `compareComputeResult` against the original and the imported buffer, and check the
    //      element size / byte size reported by the imported buffer's desc.
    //   4. Bind the imported buffer to the "compute-trivial" program, dispatch it on `dstDevice`,
    //      and compare the buffer against {1, 2, 3, 4}.
    //
    // Parameters:
    //   srcDevice - device that creates the original buffer and provides the shared handle.
    //   dstDevice - device that creates a buffer from the handle and runs the compute dispatch.
    //   context   - unit-test context; not referenced inside this function.
    //
    // Failures are reported through the GFX_CHECK_CALL_ABORT / SLANG_CHECK macros.
    void sharedBufferTestImpl(IDevice* srcDevice, IDevice* dstDevice, UnitTestContext* context)
    {
        // Create a shareable buffer using srcDevice, get its handle, then create a buffer from that handle using
        // dstDevice. Read back the buffer and check that its contents are correct.
        // `numberCount` must stay in sync with the number of elements in `initialData`.
        const int numberCount = 4;
        float initialData[] = { 0.0f, 1.0f, 2.0f, 3.0f };
        IBufferResource::Desc bufferDesc = {};
        bufferDesc.sizeInBytes = numberCount * sizeof(float);
        bufferDesc.format = gfx::Format::Unknown;
        bufferDesc.elementSize = sizeof(float);
        bufferDesc.allowedStates = ResourceStateSet(
            ResourceState::ShaderResource,
            ResourceState::UnorderedAccess,
            ResourceState::CopyDestination,
            ResourceState::CopySource);
        bufferDesc.defaultState = ResourceState::UnorderedAccess;
        bufferDesc.memoryType = MemoryType::DeviceLocal;
        // Request a shareable resource so that getSharedHandle() below can be used on it.
        bufferDesc.isShared = true;

        ComPtr<IBufferResource> srcBuffer;
        GFX_CHECK_CALL_ABORT(srcDevice->createBufferResource(
            bufferDesc,
            (void*)initialData,
            srcBuffer.writeRef()));

        // The same desc that created srcBuffer is reused to describe the imported buffer.
        InteropHandle sharedHandle;
        GFX_CHECK_CALL_ABORT(srcBuffer->getSharedHandle(&sharedHandle));
        ComPtr<IBufferResource> dstBuffer;
        GFX_CHECK_CALL_ABORT(dstDevice->createBufferFromSharedHandle(sharedHandle, bufferDesc, dstBuffer.writeRef()));
        // Reading back the buffer from srcDevice to make sure it's been filled in before reading anything back from dstDevice
        // TODO: Implement actual synchronization (and not this hacky solution)
        compareComputeResult(srcDevice, srcBuffer, Slang::makeArray<float>(0.0f, 1.0f, 2.0f, 3.0f));

        // Only the success of getNativeResourceHandle() is checked; the returned handle itself is
        // not inspected.
        InteropHandle testHandle;
        GFX_CHECK_CALL_ABORT(dstBuffer->getNativeResourceHandle(&testHandle));
        // The imported buffer should report the same element size and byte size it was created with.
        IBufferResource::Desc* testDesc = dstBuffer->getDesc();
        SLANG_CHECK(testDesc->elementSize == sizeof(float));
        SLANG_CHECK(testDesc->sizeInBytes == numberCount * sizeof(float));
        compareComputeResult(dstDevice, dstBuffer, Slang::makeArray<float>(0.0f, 1.0f, 2.0f, 3.0f));

        // Check that dstBuffer can be successfully used in a compute dispatch using dstDevice.
        Slang::ComPtr<ITransientResourceHeap> transientHeap;
        ITransientResourceHeap::Desc transientHeapDesc = {};
        transientHeapDesc.constantBufferSize = 4096;
        GFX_CHECK_CALL_ABORT(
            dstDevice->createTransientResourceHeap(transientHeapDesc, transientHeap.writeRef()));

        // `slangReflection` is handed to loadComputeProgram() but is not read afterwards in this test.
        ComPtr<IShaderProgram> shaderProgram;
        slang::ProgramLayout* slangReflection;
        GFX_CHECK_CALL_ABORT(loadComputeProgram(dstDevice, shaderProgram, "compute-trivial", "computeMain", slangReflection));

        ComputePipelineStateDesc pipelineDesc = {};
        pipelineDesc.program = shaderProgram.get();
        ComPtr<gfx::IPipelineState> pipelineState;
        GFX_CHECK_CALL_ABORT(
            dstDevice->createComputePipelineState(pipelineDesc, pipelineState.writeRef()));

        // Unordered-access view over the imported buffer, so the shader can be given it as "buffer".
        ComPtr<IResourceView> bufferView;
        IResourceView::Desc viewDesc = {};
        viewDesc.type = IResourceView::Type::UnorderedAccess;
        viewDesc.format = Format::Unknown;
        GFX_CHECK_CALL_ABORT(
            dstDevice->createBufferView(dstBuffer, nullptr, viewDesc, bufferView.writeRef()));

        // Record and submit a single 1x1x1 dispatch. The queue, command buffer and encoder are
        // scoped to this block.
        {
            // NOTE(review): a Graphics queue is requested although only compute work is submitted;
            // presumably this is the queue type the tested devices expose - confirm.
            ICommandQueue::Desc queueDesc = { ICommandQueue::QueueType::Graphics };
            auto queue = dstDevice->createCommandQueue(queueDesc);

            auto commandBuffer = transientHeap->createCommandBuffer();
            auto encoder = commandBuffer->encodeComputeCommands();

            auto rootObject = encoder->bindPipeline(pipelineState);

            ShaderCursor rootCursor(rootObject);
            // Bind buffer view to the entry point.
            rootCursor.getPath("buffer").setResource(bufferView);

            encoder->dispatchCompute(1, 1, 1);
            encoder->endEncoding();
            commandBuffer->close();
            queue->executeCommandBuffer(commandBuffer);
            // Presumably blocks until the submitted work has finished, so the comparison below
            // sees the dispatch's output - confirm against the ICommandQueue documentation.
            queue->waitOnHost();
        }

        // Expected values are the initial contents plus one per element; presumably that is what
        // the "compute-trivial" shader writes - verify against the shader source.
        compareComputeResult(
            dstDevice,
            dstBuffer,
            Slang::makeArray<float>(1.0f, 2.0f, 3.0f, 4.0f));
    }

    // Creates one testing device for `srcApi` and one for `dstApi`, then runs the shared-buffer
    // test with the first as the source device and the second as the destination device.
    // If either device could not be created, SLANG_IGNORE_TEST is invoked instead.
    void sharedBufferTestAPI(UnitTestContext* context, Slang::RenderApiFlag::Enum srcApi, Slang::RenderApiFlag::Enum dstApi)
    {
        auto exportingDevice = createTestingDevice(context, srcApi);
        auto importingDevice = createTestingDevice(context, dstApi);

        const bool haveBothDevices = exportingDevice && importingDevice;
        if (!haveBothDevices)
        {
            // Keep the braces: the macro may expand to more than a single statement.
            SLANG_IGNORE_TEST;
        }

        sharedBufferTestImpl(exportingDevice, importingDevice, context);
    }
#if SLANG_WIN64
    // Shared-buffer test with a D3D12 source device and a CUDA destination device.
    SLANG_UNIT_TEST(sharedBufferD3D12ToCUDA)
    {
        const auto exporterApi = Slang::RenderApiFlag::D3D12;
        const auto importerApi = Slang::RenderApiFlag::CUDA;
        sharedBufferTestAPI(unitTestContext, exporterApi, importerApi);
    }

    // Shared-buffer test with a Vulkan source device and a CUDA destination device.
    SLANG_UNIT_TEST(sharedBufferVulkanToCUDA)
    {
        const auto exporterApi = Slang::RenderApiFlag::Vulkan;
        const auto importerApi = Slang::RenderApiFlag::CUDA;
        sharedBufferTestAPI(unitTestContext, exporterApi, importerApi);
    }
#endif
}