port from perforce
This commit is contained in:
351
ruins64k/tools/NvPerfUtility/include/NvPerfD3D12.h
Normal file
351
ruins64k/tools/NvPerfUtility/include/NvPerfD3D12.h
Normal file
@@ -0,0 +1,351 @@
|
||||
/*
|
||||
* Copyright 2014-2021 NVIDIA Corporation. All rights reserved.
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#pragma once
|
||||
|
||||
#include "NvPerfInit.h"
|
||||
#include "NvPerfDeviceProperties.h"
|
||||
#include "NvPerfD3D.h"
|
||||
#include "nvperf_d3d12_host.h"
|
||||
#include "nvperf_d3d12_target.h"
|
||||
#include <D3D12.h>
|
||||
#include <atlbase.h>
|
||||
|
||||
namespace nv { namespace perf {
|
||||
|
||||
//
|
||||
// D3D Only Utilities
|
||||
//
|
||||
|
||||
inline bool D3D12FindAdapterForDevice(ID3D12Device* pDevice, IDXGIAdapter1** ppDXGIAdapter, DXGI_ADAPTER_DESC1* pAdapterDesc = nullptr)
|
||||
{
|
||||
const LUID deviceLuid = pDevice->GetAdapterLuid();
|
||||
|
||||
CComPtr<IDXGIFactory1> pDXGIFactory;
|
||||
HRESULT hr = CreateDXGIFactory1(IID_PPV_ARGS(&pDXGIFactory));
|
||||
if (FAILED(hr))
|
||||
{
|
||||
return false;
|
||||
}
|
||||
|
||||
for (UINT adapterIndex = 0; ; ++adapterIndex)
|
||||
{
|
||||
CComPtr<IDXGIAdapter1> pDXGIAdapter;
|
||||
hr = pDXGIFactory->EnumAdapters1(adapterIndex, &pDXGIAdapter);
|
||||
if (FAILED(hr))
|
||||
{
|
||||
break; // the intended loop termination
|
||||
}
|
||||
|
||||
DXGI_ADAPTER_DESC1 adapterDesc = {};
|
||||
HRESULT hr = pDXGIAdapter->GetDesc1(&adapterDesc);
|
||||
if (FAILED(hr))
|
||||
{
|
||||
continue;
|
||||
}
|
||||
|
||||
if (!memcmp(&adapterDesc.AdapterLuid, &deviceLuid, sizeof(deviceLuid)))
|
||||
{
|
||||
*ppDXGIAdapter = pDXGIAdapter.Detach();
|
||||
if (pAdapterDesc)
|
||||
{
|
||||
*pAdapterDesc = adapterDesc;
|
||||
}
|
||||
return true;
|
||||
}
|
||||
}
|
||||
|
||||
return false;
|
||||
}
|
||||
|
||||
inline std::wstring D3D12GetDeviceName(ID3D12Device* pDevice)
|
||||
{
|
||||
DXGI_ADAPTER_DESC1 adapterDesc = {};
|
||||
CComPtr<IDXGIAdapter1> pDXGIAdapter;
|
||||
if (!D3D12FindAdapterForDevice(pDevice, &pDXGIAdapter, &adapterDesc))
|
||||
{
|
||||
return L"";
|
||||
}
|
||||
|
||||
return adapterDesc.Description;
|
||||
}
|
||||
|
||||
|
||||
inline bool D3D12IsNvidiaDevice(ID3D12Device* pDevice)
|
||||
{
|
||||
CComPtr<IDXGIAdapter1> pDXGIAdapter;
|
||||
if (!D3D12FindAdapterForDevice(pDevice, &pDXGIAdapter))
|
||||
{
|
||||
return false;
|
||||
}
|
||||
|
||||
const bool isNvidiaDevice = DxgiIsNvidiaDevice(pDXGIAdapter);
|
||||
return isNvidiaDevice;
|
||||
}
|
||||
|
||||
inline bool D3D12IsNvidiaDevice(ID3D12CommandQueue* pCommandQueue)
|
||||
{
|
||||
CComPtr<ID3D12Device> pDevice;
|
||||
HRESULT hr = pCommandQueue->GetDevice(IID_PPV_ARGS(&pDevice));
|
||||
if (FAILED(hr))
|
||||
{
|
||||
return false;
|
||||
}
|
||||
|
||||
const bool isNvidiaDevice = D3D12IsNvidiaDevice(pDevice);
|
||||
return isNvidiaDevice;
|
||||
}
|
||||
|
||||
//
|
||||
// D3D12 NvPerf Utilities
|
||||
//
|
||||
|
||||
inline bool D3D12LoadDriver()
|
||||
{
|
||||
NVPW_D3D12_LoadDriver_Params loadDriverParams = { NVPW_D3D12_LoadDriver_Params_STRUCT_SIZE };
|
||||
NVPA_Status nvpaStatus = NVPW_D3D12_LoadDriver(&loadDriverParams);
|
||||
if (nvpaStatus)
|
||||
{
|
||||
NV_PERF_LOG_ERR(10, "NVPW_D3D12_LoadDriver failed\n");
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
|
||||
inline size_t D3D12GetNvperfDeviceIndex(ID3D12Device* pDevice, size_t sliIndex = 0)
|
||||
{
|
||||
NVPW_D3D12_Device_GetDeviceIndex_Params getDeviceIndexParams = { NVPW_D3D12_Device_GetDeviceIndex_Params_STRUCT_SIZE };
|
||||
getDeviceIndexParams.pDevice = pDevice;
|
||||
getDeviceIndexParams.sliIndex = sliIndex;
|
||||
NVPA_Status nvpaStatus = NVPW_D3D12_Device_GetDeviceIndex(&getDeviceIndexParams);
|
||||
if (nvpaStatus)
|
||||
{
|
||||
return ~size_t(0);
|
||||
}
|
||||
|
||||
return getDeviceIndexParams.deviceIndex;
|
||||
}
|
||||
|
||||
inline DeviceIdentifiers D3D12GetDeviceIdentifiers(ID3D12Device* pDevice, size_t sliIndex = 0)
|
||||
{
|
||||
CComPtr<IDXGIAdapter1> pDXGIAdapter;
|
||||
if (!D3D12FindAdapterForDevice(pDevice, &pDXGIAdapter))
|
||||
{
|
||||
return {};
|
||||
}
|
||||
|
||||
return D3DGetDeviceIdentifiers(pDXGIAdapter, sliIndex);
|
||||
}
|
||||
|
||||
inline NVPW_Device_ClockStatus D3D12GetDeviceClockState(ID3D12Device* pDevice)
|
||||
{
|
||||
size_t nvperfDeviceIndex = D3D12GetNvperfDeviceIndex(pDevice);
|
||||
return GetDeviceClockState(nvperfDeviceIndex);
|
||||
}
|
||||
|
||||
inline bool D3D12SetDeviceClockState(ID3D12Device* pDevice, NVPW_Device_ClockSetting clockSetting)
|
||||
{
|
||||
size_t nvperfDeviceIndex = D3D12GetNvperfDeviceIndex(pDevice);
|
||||
return SetDeviceClockState(nvperfDeviceIndex, clockSetting);
|
||||
}
|
||||
|
||||
inline bool D3D12SetDeviceClockState(ID3D12Device* pDevice, NVPW_Device_ClockStatus clockStatus)
|
||||
{
|
||||
size_t nvperfDeviceIndex = D3D12GetNvperfDeviceIndex(pDevice);
|
||||
return SetDeviceClockState(nvperfDeviceIndex, clockStatus);
|
||||
}
|
||||
|
||||
inline size_t D3D12CalculateMetricsEvaluatorScratchBufferSize(const char* pChipName)
|
||||
{
|
||||
NVPW_D3D12_MetricsEvaluator_CalculateScratchBufferSize_Params calculateScratchBufferSizeParams = { NVPW_D3D12_MetricsEvaluator_CalculateScratchBufferSize_Params_STRUCT_SIZE };
|
||||
calculateScratchBufferSizeParams.pChipName = pChipName;
|
||||
NVPA_Status nvpaStatus = NVPW_D3D12_MetricsEvaluator_CalculateScratchBufferSize(&calculateScratchBufferSizeParams);
|
||||
if (nvpaStatus)
|
||||
{
|
||||
NV_PERF_LOG_ERR(20, "NVPW_D3D12_MetricsEvaluator_CalculateScratchBufferSize failed\n");
|
||||
return 0;
|
||||
}
|
||||
return calculateScratchBufferSizeParams.scratchBufferSize;
|
||||
}
|
||||
|
||||
inline NVPW_MetricsEvaluator* D3D12CreateMetricsEvaluator(uint8_t* pScratchBuffer, size_t scratchBufferSize, const char* pChipName)
|
||||
{
|
||||
NVPW_D3D12_MetricsEvaluator_Initialize_Params initializeParams = { NVPW_D3D12_MetricsEvaluator_Initialize_Params_STRUCT_SIZE };
|
||||
initializeParams.pScratchBuffer = pScratchBuffer;
|
||||
initializeParams.scratchBufferSize = scratchBufferSize;
|
||||
initializeParams.pChipName = pChipName;
|
||||
NVPA_Status nvpaStatus = NVPW_D3D12_MetricsEvaluator_Initialize(&initializeParams);
|
||||
if (nvpaStatus)
|
||||
{
|
||||
NV_PERF_LOG_ERR(20, "NVPW_D3D12_MetricsEvaluator_Initialize failed\n");
|
||||
return nullptr;
|
||||
}
|
||||
return initializeParams.pMetricsEvaluator;
|
||||
}
|
||||
|
||||
}}
|
||||
|
||||
namespace nv { namespace perf { namespace profiler {
|
||||
|
||||
inline NVPA_RawMetricsConfig* D3D12CreateRawMetricsConfig(const char* pChipName)
|
||||
{
|
||||
NVPW_D3D12_RawMetricsConfig_Create_Params configParams = { NVPW_D3D12_RawMetricsConfig_Create_Params_STRUCT_SIZE };
|
||||
configParams.activityKind = NVPA_ACTIVITY_KIND_PROFILER;
|
||||
configParams.pChipName = pChipName;
|
||||
|
||||
NVPA_Status nvpaStatus = NVPW_D3D12_RawMetricsConfig_Create(&configParams);
|
||||
if (nvpaStatus)
|
||||
{
|
||||
NV_PERF_LOG_ERR(20, "NVPW_D3D12_RawMetricsConfig_Create failed\n");
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
return configParams.pRawMetricsConfig;
|
||||
}
|
||||
|
||||
inline bool D3D12IsGpuSupported(ID3D12Device* pDevice, size_t sliIndex = 0)
|
||||
{
|
||||
const size_t deviceIndex = D3D12GetNvperfDeviceIndex(pDevice, sliIndex);
|
||||
if (deviceIndex == ~size_t(0))
|
||||
{
|
||||
NV_PERF_LOG_ERR(10, "D3D12GetNvperfDeviceIndex failed on %ls\n", D3D12GetDeviceName(pDevice).c_str());
|
||||
return false;
|
||||
}
|
||||
|
||||
NVPW_D3D12_Profiler_IsGpuSupported_Params params = { NVPW_D3D12_Profiler_IsGpuSupported_Params_STRUCT_SIZE };
|
||||
params.deviceIndex = deviceIndex;
|
||||
NVPA_Status nvpaStatus = NVPW_D3D12_Profiler_IsGpuSupported(¶ms);
|
||||
if (nvpaStatus)
|
||||
{
|
||||
NV_PERF_LOG_ERR(10, "NVPW_D3D12_Profiler_IsGpuSupported failed on %ls\n", D3D12GetDeviceName(pDevice).c_str());
|
||||
return false;
|
||||
}
|
||||
|
||||
if (!params.isSupported)
|
||||
{
|
||||
NV_PERF_LOG_ERR(10, "%ls is not supported\n", D3D12GetDeviceName(pDevice).c_str());
|
||||
if (params.gpuArchitectureSupportLevel != NVPW_GPU_ARCHITECTURE_SUPPORT_LEVEL_SUPPORTED)
|
||||
{
|
||||
const DeviceIdentifiers deviceIdentifiers = D3D12GetDeviceIdentifiers(pDevice, sliIndex);
|
||||
NV_PERF_LOG_ERR(10, "Unsupported GPU architecture %s\n", deviceIdentifiers.pChipName);
|
||||
}
|
||||
if (params.sliSupportLevel == NVPW_SLI_SUPPORT_LEVEL_UNSUPPORTED)
|
||||
{
|
||||
NV_PERF_LOG_ERR(10, "Devices in SLI configuration are not supported.\n");
|
||||
}
|
||||
return false;
|
||||
}
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
inline bool D3D12IsGpuSupported(ID3D12CommandQueue* pCommandQueue, size_t sliIndex = 0)
|
||||
{
|
||||
CComPtr<ID3D12Device> pDevice;
|
||||
HRESULT hr = pCommandQueue->GetDevice(IID_PPV_ARGS(&pDevice));
|
||||
if (FAILED(hr))
|
||||
{
|
||||
return false;
|
||||
}
|
||||
|
||||
const bool isGpuSupported = D3D12IsGpuSupported(pDevice, sliIndex);
|
||||
return isGpuSupported;
|
||||
}
|
||||
|
||||
|
||||
inline bool D3D12PushRange(ID3D12GraphicsCommandList* pCommandList, const char* pRangeName)
|
||||
{
|
||||
NVPW_D3D12_Profiler_CommandList_PushRange_Params pushRangeParams = { NVPW_D3D12_Profiler_CommandList_PushRange_Params_STRUCT_SIZE };
|
||||
pushRangeParams.pRangeName = pRangeName;
|
||||
pushRangeParams.rangeNameLength = 0;
|
||||
pushRangeParams.pCommandList = pCommandList;
|
||||
NVPA_Status nvpaStatus = NVPW_D3D12_Profiler_CommandList_PushRange(&pushRangeParams);
|
||||
if (nvpaStatus)
|
||||
{
|
||||
NV_PERF_LOG_ERR(50, "NVPW_D3D12_Profiler_CommandList_PushRange failed\n");
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
inline bool D3D12PopRange(ID3D12GraphicsCommandList* pCommandList)
|
||||
{
|
||||
NVPW_D3D12_Profiler_CommandList_PopRange_Params popParams = { NVPW_D3D12_Profiler_CommandList_PopRange_Params_STRUCT_SIZE };
|
||||
popParams.pCommandList = pCommandList;
|
||||
NVPA_Status nvpaStatus = NVPW_D3D12_Profiler_CommandList_PopRange(&popParams);
|
||||
if (nvpaStatus)
|
||||
{
|
||||
NV_PERF_LOG_ERR(50, "NVPW_D3D12_Profiler_CommandList_PopRange failed\n");
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
inline bool D3D12PushRange_Nop(ID3D12GraphicsCommandList* pCommandList, const char* pRangeName)
|
||||
{
|
||||
return false;
|
||||
}
|
||||
|
||||
inline bool D3D12PopRange_Nop(ID3D12GraphicsCommandList* pCommandList)
|
||||
{
|
||||
return false;
|
||||
}
|
||||
|
||||
//
|
||||
struct D3D12RangeCommands
|
||||
{
|
||||
bool isNvidiaDevice;
|
||||
bool(*PushRange)(ID3D12GraphicsCommandList* pCommandList, const char* pRangeName);
|
||||
bool(*PopRange)(ID3D12GraphicsCommandList* pCommandList);
|
||||
|
||||
public:
|
||||
D3D12RangeCommands()
|
||||
: isNvidiaDevice(false)
|
||||
, PushRange(&D3D12PushRange_Nop)
|
||||
, PopRange(&D3D12PopRange_Nop)
|
||||
{
|
||||
}
|
||||
|
||||
void Initialize(bool isNvidiaDevice_)
|
||||
{
|
||||
isNvidiaDevice = isNvidiaDevice_;
|
||||
if (isNvidiaDevice_)
|
||||
{
|
||||
PushRange = &D3D12PushRange;
|
||||
PopRange = &D3D12PopRange;
|
||||
}
|
||||
else
|
||||
{
|
||||
PushRange = &D3D12PushRange_Nop;
|
||||
PopRange = &D3D12PopRange_Nop;
|
||||
}
|
||||
}
|
||||
|
||||
void Initialize(IDXGIAdapter* pDXGIAdapter)
|
||||
{
|
||||
const bool isNvidiaDevice_ = DxgiIsNvidiaDevice(pDXGIAdapter);
|
||||
return Initialize(isNvidiaDevice_);
|
||||
}
|
||||
|
||||
void Initialize(ID3D12Device* pDevice)
|
||||
{
|
||||
const bool isNvidiaDevice_ = D3D12IsNvidiaDevice(pDevice);
|
||||
return Initialize(isNvidiaDevice_);
|
||||
}
|
||||
};
|
||||
|
||||
}}}
|
||||
Reference in New Issue
Block a user