summaryrefslogtreecommitdiffstats
path: root/tools/render-test
diff options
context:
space:
mode:
authorGangzheng Tong <tonggangzheng@gmail.com>2025-09-22 15:46:42 -0700
committerGitHub <noreply@github.com>2025-09-22 22:46:42 +0000
commitba8132345cbae5b749b4a01deda732ad6f8251a0 (patch)
treef00ad0dd2d26f49112e430615106c9f6d22de032 /tools/render-test
parentbd24cc271c5d151dbaa7e4da674cbc219aef8153 (diff)
Add RHI Device Caching and Test Prefix Exclusion (#8448)
# Add RHI Device Caching and Test Prefix Exclusion ## Summary This PR introduces two key improvements to the Slang test infrastructure: 1. **RHI Device Caching**: Implements device caching to significantly speed up test execution by reusing graphics devices across tests, **RHI Device Caching reduces slang-test execution time from ~15 minutes to ~5 minutes in Windows release builds** 2. **Test Prefix Exclusion**: Adds `-exclude-prefix` option to skip tests matching specified path prefixes ## Changes ### RHI Device Caching - **New `DeviceCache` class** (`slang-test-device-cache.h/cpp`): Thread-safe device cache with LRU eviction (max 10 devices) - **Cache control option**: `-cache-rhi-device` flag in both `slang-test` and `render-test` - Default: **enabled** in slang-test, **disabled** in render-test when run standalone - Automatically skips caching for CUDA devices (due to driver issues) - **Performance benefit**: Eliminates expensive device creation/destruction cycles, especially beneficial for Vulkan on Tegra platforms ### Test Prefix Exclusion - **New `-exclude-prefix <prefix>` option** in slang-test - Allows excluding entire test directories or patterns from execution - Complements existing `-category` and individual test filtering options ### Usage Examples ```bash # Enable device caching (default) slang-test # Disable device caching slang-test -cache-rhi-device false # Exclude tests from specific directories slang-test -exclude-prefix tests/problematic/ slang-test -exclude-prefix tests/slow/ -exclude-prefix tests/experimental/ ``` This change should significantly improve test execution performance, particularly in CI environments with frequent device operations. This is needed for running the GPU test in aarch64, where repeated device creation/destroy is causing driver issues. Needed by: https://github.com/shader-slang/slang/issues/8346 --------- Co-authored-by: slangbot <ellieh+slangbot@nvidia.com> Co-authored-by: slangbot <186143334+slangbot@users.noreply.github.com>
Diffstat (limited to 'tools/render-test')
-rw-r--r--tools/render-test/options.cpp4
-rw-r--r--tools/render-test/options.h3
-rw-r--r--tools/render-test/render-test-main.cpp45
-rw-r--r--tools/render-test/slang-test-device-cache.cpp160
-rw-r--r--tools/render-test/slang-test-device-cache.h97
5 files changed, 299 insertions, 10 deletions
diff --git a/tools/render-test/options.cpp b/tools/render-test/options.cpp
index 120e03456..0ecda6944 100644
--- a/tools/render-test/options.cpp
+++ b/tools/render-test/options.cpp
@@ -278,6 +278,10 @@ static rhi::DeviceType _toRenderType(Slang::RenderApiType apiType)
{
outOptions.showAdapterInfo = true;
}
+ else if (argValue == "-cache-rhi-device")
+ {
+ outOptions.cacheRhiDevice = true;
+ }
else
{
// Lookup
diff --git a/tools/render-test/options.h b/tools/render-test/options.h
index 49e05c440..bbc2364cd 100644
--- a/tools/render-test/options.h
+++ b/tools/render-test/options.h
@@ -96,6 +96,9 @@ struct Options
bool skipSPIRVValidation = false;
+ // Whether to enable RHI device caching (default: false in render-test)
+ bool cacheRhiDevice = false;
+
Slang::List<Slang::String> capabilities;
Options() { downstreamArgs.addName("slang"); }
diff --git a/tools/render-test/render-test-main.cpp b/tools/render-test/render-test-main.cpp
index 991d60683..5b3974fc9 100644
--- a/tools/render-test/render-test-main.cpp
+++ b/tools/render-test/render-test-main.cpp
@@ -12,6 +12,7 @@
#include "shader-input-layout.h"
#include "shader-renderer-util.h"
#include "slang-support.h"
+#include "slang-test-device-cache.h"
#include "window.h"
#if defined(_WIN32)
@@ -1440,7 +1441,7 @@ static SlangResult _innerMain(
}
}
- renderer_test::CoreToRHIDebugBridge debugCallback;
+ static renderer_test::CoreToRHIDebugBridge debugCallback;
debugCallback.setCoreCallback(stdWriters->getDebugCallback());
// Use the profile name set on options if set
@@ -1495,7 +1496,7 @@ static SlangResult _innerMain(
return SLANG_E_NOT_AVAILABLE;
}
- Slang::ComPtr<IDevice> device;
+ CachedDeviceWrapper deviceWrapper;
{
DeviceDesc desc = {};
desc.deviceType = options.deviceType;
@@ -1558,8 +1559,27 @@ static SlangResult _innerMain(
{
getRHI()->enableDebugLayers();
}
- SlangResult res = getRHI()->createDevice(desc, device.writeRef());
- if (SLANG_FAILED(res))
+ Slang::ComPtr<rhi::IDevice> rhiDevice;
+ SlangResult res;
+ if (options.cacheRhiDevice)
+ {
+ res = DeviceCache::acquireDevice(desc, rhiDevice.writeRef());
+ if (SLANG_FAILED(res))
+ {
+ rhiDevice = nullptr;
+ }
+ }
+ else
+ {
+ res = rhi::getRHI()->createDevice(desc, rhiDevice.writeRef());
+ if (SLANG_FAILED(res))
+ {
+ rhiDevice = nullptr;
+ }
+ }
+
+ // Check result for both cached and non-cached paths
+ if (SLANG_FAILED(res) || !rhiDevice)
{
// We need to be careful here about SLANG_E_NOT_AVAILABLE. This return value means
// that the renderer couldn't be created because it required *features* that were
@@ -1575,21 +1595,20 @@ static SlangResult _innerMain(
{
return res;
}
-
if (!options.onlyStartup)
{
fprintf(stderr, "Unable to create renderer %s\n", rendererName.getBuffer());
}
-
return res;
}
- SLANG_ASSERT(device);
+ SLANG_ASSERT(rhiDevice);
+ deviceWrapper = CachedDeviceWrapper(rhiDevice);
}
for (const auto& feature : requiredFeatureList)
{
// If doesn't have required feature... we have to give up
- if (!device->hasFeature(feature))
+ if (!deviceWrapper->hasFeature(feature))
{
return SLANG_E_NOT_AVAILABLE;
}
@@ -1599,7 +1618,7 @@ static SlangResult _innerMain(
// Print adapter info after device creation but before any other operations
if (options.showAdapterInfo)
{
- auto info = device->getInfo();
+ auto info = deviceWrapper->getInfo();
auto out = stdWriters->getOut();
out.print("Using graphics adapter: %s\n", info.adapterName);
}
@@ -1613,14 +1632,20 @@ static SlangResult _innerMain(
{
RenderTestApp app;
renderDocBeginFrame();
- SLANG_RETURN_ON_FAIL(app.initialize(session, device, options, input));
+ SLANG_RETURN_ON_FAIL(app.initialize(session, deviceWrapper.get(), options, input));
app.update();
renderDocEndFrame();
app.finalize();
}
+
return SLANG_OK;
}
+SLANG_TEST_TOOL_API void cleanDeviceCache()
+{
+ DeviceCache::cleanCache();
+}
+
SLANG_TEST_TOOL_API SlangResult innerMain(
Slang::StdWriters* stdWriters,
SlangSession* sharedSession,
diff --git a/tools/render-test/slang-test-device-cache.cpp b/tools/render-test/slang-test-device-cache.cpp
new file mode 100644
index 000000000..a486ee3f3
--- /dev/null
+++ b/tools/render-test/slang-test-device-cache.cpp
@@ -0,0 +1,160 @@
+#include "slang-test-device-cache.h"
+
+#include <algorithm>
+
+// Static member accessor functions (Meyer's singleton pattern)
+// This ensures proper destruction order - function-local statics are destroyed
+// in reverse order of first access, avoiding the static destruction order fiasco
+std::mutex& DeviceCache::getMutex()
+{
+ static std::mutex instance;
+ return instance;
+}
+
+std::unordered_map<
+ DeviceCache::DeviceCacheKey,
+ DeviceCache::CachedDevice,
+ DeviceCache::DeviceCacheKeyHash>&
+DeviceCache::getDeviceCache()
+{
+ static std::unordered_map<DeviceCacheKey, CachedDevice, DeviceCacheKeyHash> instance;
+ return instance;
+}
+
+uint64_t& DeviceCache::getNextCreationOrder()
+{
+ static uint64_t instance = 0;
+ return instance;
+}
+
+bool DeviceCache::DeviceCacheKey::operator==(const DeviceCacheKey& other) const
+{
+ return deviceType == other.deviceType && enableValidation == other.enableValidation &&
+ enableRayTracingValidation == other.enableRayTracingValidation &&
+ profileName == other.profileName && requiredFeatures == other.requiredFeatures;
+}
+
+std::size_t DeviceCache::DeviceCacheKeyHash::operator()(const DeviceCacheKey& key) const
+{
+ std::size_t h1 = std::hash<int>{}(static_cast<int>(key.deviceType));
+ std::size_t h2 = std::hash<bool>{}(key.enableValidation);
+ std::size_t h3 = std::hash<bool>{}(key.enableRayTracingValidation);
+ std::size_t h4 = std::hash<std::string>{}(key.profileName);
+
+ std::size_t h5 = 0;
+ for (const auto& feature : key.requiredFeatures)
+ {
+ h5 ^= std::hash<std::string>{}(feature) + 0x9e3779b9 + (h5 << 6) + (h5 >> 2);
+ }
+
+ return h1 ^ (h2 << 1) ^ (h3 << 2) ^ (h4 << 3) ^ (h5 << 4);
+}
+
+DeviceCache::CachedDevice::CachedDevice()
+ : creationOrder(0)
+{
+}
+
+void DeviceCache::evictOldestDeviceIfNeeded()
+{
+ auto& deviceCache = getDeviceCache();
+ if (deviceCache.size() < MAX_CACHED_DEVICES)
+ return;
+
+ // Find the oldest device to evict
+ auto oldestIt = deviceCache.end();
+ uint64_t oldestCreationOrder = UINT64_MAX;
+
+ for (auto it = deviceCache.begin(); it != deviceCache.end(); ++it)
+ {
+ if (it->second.creationOrder < oldestCreationOrder)
+ {
+ oldestCreationOrder = it->second.creationOrder;
+ oldestIt = it;
+ }
+ }
+
+ // Remove the oldest device - ComPtr will handle the actual device release
+ if (oldestIt != deviceCache.end())
+ {
+ deviceCache.erase(oldestIt);
+ }
+}
+
+SlangResult DeviceCache::acquireDevice(const rhi::DeviceDesc& desc, rhi::IDevice** outDevice)
+{
+ if (!outDevice)
+ return SLANG_E_INVALID_ARG;
+
+ *outDevice = nullptr;
+
+ // Skip caching for CUDA devices due to crashes
+ if (desc.deviceType == rhi::DeviceType::CUDA)
+ {
+ return rhi::getRHI()->createDevice(desc, outDevice);
+ }
+
+ std::lock_guard<std::mutex> lock(getMutex());
+ auto& deviceCache = getDeviceCache();
+ auto& nextCreationOrder = getNextCreationOrder();
+
+ // Create cache key
+ DeviceCacheKey key;
+ key.deviceType = desc.deviceType;
+ key.enableValidation = desc.enableValidation;
+ key.enableRayTracingValidation = desc.enableRayTracingValidation;
+ key.profileName = desc.slang.targetProfile ? desc.slang.targetProfile : "Unknown";
+
+ // Add required features to key
+ for (int i = 0; i < desc.requiredFeatureCount; ++i)
+ {
+ key.requiredFeatures.push_back(desc.requiredFeatures[i]);
+ }
+ std::sort(key.requiredFeatures.begin(), key.requiredFeatures.end());
+
+ // Evict oldest device if we've reached the limit
+ evictOldestDeviceIfNeeded();
+
+ // Check if we have a cached device
+ auto it = deviceCache.find(key);
+ if (it != deviceCache.end())
+ {
+ // Return the cached device - COM reference counting handles the references
+ *outDevice = it->second.device.get();
+ if (*outDevice)
+ {
+ (*outDevice)->addRef();
+ return SLANG_OK;
+ }
+ }
+
+ // Create new device
+ Slang::ComPtr<rhi::IDevice> device;
+ auto result = rhi::getRHI()->createDevice(desc, device.writeRef());
+ if (SLANG_FAILED(result))
+ {
+ return result;
+ }
+
+ // Cache the device
+ CachedDevice& cached = deviceCache[key];
+ cached.device = device;
+ cached.creationOrder = nextCreationOrder++;
+
+ // Return the device with proper reference counting
+ *outDevice = device.get();
+ if (*outDevice)
+ {
+ (*outDevice)->addRef();
+ }
+
+ return SLANG_OK;
+}
+
+
+void DeviceCache::cleanCache()
+{
+ std::lock_guard<std::mutex> lock(getMutex());
+ auto& deviceCache = getDeviceCache();
+ deviceCache.clear();
+}
diff --git a/tools/render-test/slang-test-device-cache.h b/tools/render-test/slang-test-device-cache.h
new file mode 100644
index 000000000..752d03ff1
--- /dev/null
+++ b/tools/render-test/slang-test-device-cache.h
@@ -0,0 +1,97 @@
+#pragma once
+
+#include <mutex>
+#include <slang-rhi.h>
+#include <string>
+#include <unordered_map>
+#include <vector>
+
+// Device Cache for preventing NVIDIA Tegra driver state corruption
+// This cache reuses Vulkan instances and devices to avoid the VK_ERROR_INCOMPATIBLE_DRIVER
+// issue that occurs after ~19 device creation/destruction cycles on Tegra platforms.
+// Uses ComPtr for automatic device lifecycle management - devices are released when removed from
+// cache.
+class DeviceCache
+{
+public:
+ struct DeviceCacheKey
+ {
+ rhi::DeviceType deviceType;
+ bool enableValidation;
+ bool enableRayTracingValidation;
+ std::string profileName;
+ std::vector<std::string> requiredFeatures;
+
+ bool operator==(const DeviceCacheKey& other) const;
+ };
+
+ struct DeviceCacheKeyHash
+ {
+ std::size_t operator()(const DeviceCacheKey& key) const;
+ };
+
+ struct CachedDevice
+ {
+ Slang::ComPtr<rhi::IDevice> device;
+ uint64_t creationOrder;
+
+ CachedDevice();
+ };
+
+private:
+ static constexpr int MAX_CACHED_DEVICES = 10;
+
+ // Use function-local statics to control destruction order (Meyer's singleton pattern)
+ static std::mutex& getMutex();
+ static std::unordered_map<DeviceCacheKey, CachedDevice, DeviceCacheKeyHash>& getDeviceCache();
+ static uint64_t& getNextCreationOrder();
+
+ static void evictOldestDeviceIfNeeded();
+
+public:
+ static SlangResult acquireDevice(const rhi::DeviceDesc& desc, rhi::IDevice** outDevice);
+ static void cleanCache();
+};
+
+// RAII wrapper for cached devices to ensure proper cleanup
+class CachedDeviceWrapper
+{
+private:
+ Slang::ComPtr<rhi::IDevice> m_device;
+
+public:
+ CachedDeviceWrapper() = default;
+
+ CachedDeviceWrapper(Slang::ComPtr<rhi::IDevice> device)
+ : m_device(device)
+ {
+ }
+
+ ~CachedDeviceWrapper() {}
+
+ // Move constructor
+ CachedDeviceWrapper(CachedDeviceWrapper&& other) noexcept
+ : m_device(std::move(other.m_device))
+ {
+ }
+
+ // Move assignment
+ CachedDeviceWrapper& operator=(CachedDeviceWrapper&& other) noexcept
+ {
+ if (this != &other)
+ {
+ m_device = std::move(other.m_device);
+ }
+ return *this;
+ }
+
+ // Delete copy constructor and assignment
+ CachedDeviceWrapper(const CachedDeviceWrapper&) = delete;
+ CachedDeviceWrapper& operator=(const CachedDeviceWrapper&) = delete;
+
+ rhi::IDevice* get() const { return m_device.get(); }
+ rhi::IDevice* operator->() const { return m_device.get(); }
+ operator bool() const { return m_device != nullptr; }
+
+ Slang::ComPtr<rhi::IDevice>& getComPtr() { return m_device; }
+};