Skip to content

Commit 625e7e0

Browse files
fix: Override timestamp width from KMD
Signed-off-by: Szymon Morek <[email protected]> Source: 7f2b806
1 parent e7e9804 commit 625e7e0

File tree

13 files changed

+97
-0
lines changed

13 files changed

+97
-0
lines changed

shared/source/debug_settings/debug_variables_base.inl

+1
Original file line numberDiff line numberDiff line change
@@ -292,6 +292,7 @@ DECLARE_DEBUG_VARIABLE(int32_t, StandaloneInOrderTimestampAllocationEnabled, -1,
292292
DECLARE_DEBUG_VARIABLE(int32_t, ForceComputeWalkerPostSyncFlushWithWrite, -1, "-1: ignore. >=0: Force PostSync cache flush and override postSync immediate write address to given value")
293293
DECLARE_DEBUG_VARIABLE(int32_t, DeferStateInitSubmissionToFirstRegularUsage, -1, "-1: ignore, 0: disabled, 1: enabled. If set, instead of initializing at Device creation, submit initial state during first usage (eg. kernel submission)")
294294
DECLARE_DEBUG_VARIABLE(int32_t, ForceNonWalkerSplitMemoryCopy, -1, "-1: default, 0: disabled, 1: enabled. If set, memory copy will be executed as single byte copy Walker without performance optimizations")
295+
DECLARE_DEBUG_VARIABLE(int32_t, OverrideTimestampWidth, -1, "-1: default from KMD, > 0: Override timestamp width used for profiling. Requires XeKMD kernel.")
295296

296297
/*LOGGING FLAGS*/
297298
DECLARE_DEBUG_VARIABLE(int32_t, PrintDriverDiagnostics, -1, "prints driver diagnostics messages to standard output, value corresponds to hint level")

shared/source/execution_environment/root_device_environment.cpp

+1
Original file line numberDiff line numberDiff line change
@@ -128,6 +128,7 @@ void RootDeviceEnvironment::initOsTime() {
128128
if (!osTime) {
129129
osTime = OSTime::create(osInterface.get());
130130
osTime->setDeviceTimerResolution(*hwInfo);
131+
osTime->setDeviceTimestampWidth(gfxCoreHelper->getDeviceTimestampWidth());
131132
}
132133
}
133134

shared/source/helpers/gfx_core_helper.h

+4
Original file line numberDiff line numberDiff line change
@@ -200,6 +200,8 @@ class GfxCoreHelper {
200200

201201
virtual bool usmCompressionSupported(const NEO::HardwareInfo &hwInfo) const = 0;
202202

203+
virtual uint32_t getDeviceTimestampWidth() const = 0;
204+
203205
virtual ~GfxCoreHelper() = default;
204206

205207
protected:
@@ -436,6 +438,8 @@ class GfxCoreHelperHw : public GfxCoreHelper {
436438

437439
bool usmCompressionSupported(const NEO::HardwareInfo &hwInfo) const override;
438440

441+
uint32_t getDeviceTimestampWidth() const override;
442+
439443
~GfxCoreHelperHw() override = default;
440444

441445
protected:

shared/source/helpers/gfx_core_helper_base.inl

+8
Original file line numberDiff line numberDiff line change
@@ -801,6 +801,14 @@ bool GfxCoreHelperHw<GfxFamily>::usmCompressionSupported(const NEO::HardwareInfo
801801
return false;
802802
}
803803

804+
template <typename GfxFamily>
805+
uint32_t GfxCoreHelperHw<GfxFamily>::getDeviceTimestampWidth() const {
806+
if (debugManager.flags.OverrideTimestampWidth.get() != -1) {
807+
return debugManager.flags.OverrideTimestampWidth.get();
808+
}
809+
return 0u;
810+
}
811+
804812
template <typename Family>
805813
uint32_t GfxCoreHelperHw<Family>::getInternalCopyEngineIndex(const HardwareInfo &hwInfo) const {
806814
if (debugManager.flags.ForceBCSForInternalCopyEngine.get() != -1) {

shared/source/os_interface/linux/xe/ioctl_helper_xe.cpp

+3
Original file line numberDiff line numberDiff line change
@@ -429,6 +429,9 @@ bool IoctlHelperXe::setGpuCpuTimes(TimeStampData *pGpuCpuTime, OSTime *osTime) {
429429
ret = IoctlHelper::ioctl(DrmIoctl::query, &deviceQuery);
430430

431431
auto nValidBits = queryEngineCycles->width;
432+
if (osTime->getDeviceTimestampWidth() != 0) {
433+
nValidBits = osTime->getDeviceTimestampWidth();
434+
}
432435
auto gpuTimestampValidBits = maxNBitValue(nValidBits);
433436
auto gpuCycles = queryEngineCycles->engine_cycles & gpuTimestampValidBits;
434437

shared/source/os_interface/os_time.h

+9
Original file line numberDiff line numberDiff line change
@@ -86,6 +86,14 @@ class OSTime {
8686
deviceTime->setDeviceTimerResolution(hwInfo);
8787
}
8888

89+
void setDeviceTimestampWidth(uint32_t timestampWidth) {
90+
this->timestampWidth = timestampWidth;
91+
}
92+
93+
uint32_t getDeviceTimestampWidth() const {
94+
return this->timestampWidth;
95+
}
96+
8997
void setRefreshTimestampsFlag() const {
9098
deviceTime->setRefreshTimestampsFlag();
9199
}
@@ -99,5 +107,6 @@ class OSTime {
99107
OSInterface *osInterface = nullptr;
100108
std::unique_ptr<DeviceTime> deviceTime;
101109
uint64_t maxGpuTimeStamp = 0;
110+
uint32_t timestampWidth = 0;
102111
};
103112
} // namespace NEO

shared/source/xe2_hpg_core/gfx_core_helper_xe2_hpg_core.cpp

+8
Original file line numberDiff line numberDiff line change
@@ -332,6 +332,14 @@ uint32_t GfxCoreHelperHw<Family>::getMetricsLibraryGenId() const {
332332
return static_cast<uint32_t>(MetricsLibraryApi::ClientGen::Xe2HPG);
333333
}
334334

335+
template <>
336+
uint32_t GfxCoreHelperHw<Family>::getDeviceTimestampWidth() const {
337+
if (debugManager.flags.OverrideTimestampWidth.get() != -1) {
338+
return debugManager.flags.OverrideTimestampWidth.get();
339+
}
340+
return 64u;
341+
};
342+
335343
} // namespace NEO
336344

337345
namespace NEO {

shared/test/common/test_files/igdrcl.config

+1
Original file line numberDiff line numberDiff line change
@@ -626,4 +626,5 @@ DirectSubmissionPrintSemaphoreUsage = -1
626626
ForceNonCoherentModeForTimestamps = 0
627627
ExperimentalUSMAllocationReuseVersion = -1
628628
ForceNonWalkerSplitMemoryCopy = -1
629+
OverrideTimestampWidth = -1
629630
# Please don't edit below this line

shared/test/unit_test/helpers/gfx_core_helper_tests.cpp

+10
Original file line numberDiff line numberDiff line change
@@ -1856,3 +1856,13 @@ HWTEST_F(GfxCoreHelperTest, whenEncodeAdditionalTimestampOffsetsThenNothingEncod
18561856
GenCmdList storeRegMemList = hwParser.getCommandsList<MI_STORE_REGISTER_MEM>();
18571857
EXPECT_EQ(0u, storeRegMemList.size());
18581858
}
1859+
1860+
HWTEST_F(GfxCoreHelperTest, givenGetDeviceTimestampWidthCalledThenReturnCorrectValue) {
1861+
DebugManagerStateRestore restore;
1862+
1863+
auto &helper = getHelper<GfxCoreHelper>();
1864+
EXPECT_EQ(0u, helper.getDeviceTimestampWidth());
1865+
1866+
debugManager.flags.OverrideTimestampWidth.set(64);
1867+
EXPECT_EQ(64u, helper.getDeviceTimestampWidth());
1868+
}

shared/test/unit_test/os_interface/linux/xe/ioctl_helper_xe_tests.cpp

+29
Original file line numberDiff line numberDiff line change
@@ -1793,6 +1793,35 @@ TEST(IoctlHelperXeTest, givenIoctlFailureWhenSetGpuCpuTimesIsCalledThenProperVal
17931793
EXPECT_EQ(pGpuCpuTime.cpuTimeinNS, expectedTimestamp);
17941794
}
17951795

1796+
TEST(IoctlHelperXeTest, whenDeviceTimestampWidthSetThenProperValuesAreSet) {
1797+
DebugManagerStateRestore restorer;
1798+
auto executionEnvironment = std::make_unique<MockExecutionEnvironment>();
1799+
auto &rootDeviceEnvironment = *executionEnvironment->rootDeviceEnvironments[0];
1800+
rootDeviceEnvironment.osInterface = std::make_unique<OSInterface>();
1801+
rootDeviceEnvironment.osInterface->setDriverModel(std::make_unique<DrmMockTime>(mockFd, rootDeviceEnvironment));
1802+
auto drm = DrmMockXe::create(rootDeviceEnvironment);
1803+
auto xeIoctlHelper = static_cast<MockIoctlHelperXe *>(drm->getIoctlHelper());
1804+
auto engineInfo = xeIoctlHelper->createEngineInfo(false);
1805+
ASSERT_NE(nullptr, engineInfo);
1806+
1807+
uint64_t expectedCycles = maxNBitValue(64);
1808+
auto xeQueryEngineCycles = reinterpret_cast<drm_xe_query_engine_cycles *>(drm->queryEngineCycles);
1809+
xeQueryEngineCycles->width = 32;
1810+
xeQueryEngineCycles->engine_cycles = expectedCycles;
1811+
xeQueryEngineCycles->cpu_timestamp = 100;
1812+
1813+
TimeStampData pGpuCpuTime{};
1814+
std::unique_ptr<MockOSTimeLinux> osTime = MockOSTimeLinux::create(*rootDeviceEnvironment.osInterface);
1815+
auto ret = xeIoctlHelper->setGpuCpuTimes(&pGpuCpuTime, osTime.get());
1816+
EXPECT_EQ(true, ret);
1817+
1818+
EXPECT_EQ(pGpuCpuTime.gpuTimeStamp, expectedCycles & maxNBitValue(32));
1819+
osTime->setDeviceTimestampWidth(64);
1820+
ret = xeIoctlHelper->setGpuCpuTimes(&pGpuCpuTime, osTime.get());
1821+
EXPECT_EQ(true, ret);
1822+
EXPECT_EQ(pGpuCpuTime.gpuTimeStamp, expectedCycles);
1823+
}
1824+
17961825
TEST(IoctlHelperXeTest, whenSetDefaultEngineIsCalledThenProperEngineIsSet) {
17971826
NEO::HardwareInfo hwInfo = *NEO::defaultHwInfo.get();
17981827
auto executionEnvironment = std::make_unique<MockExecutionEnvironment>(&hwInfo);

shared/test/unit_test/xe2_hpg_core/bmg/gfx_core_helper_tests_bmg.cpp

+11
Original file line numberDiff line numberDiff line change
@@ -44,3 +44,14 @@ BMGTEST_F(GfxCoreHelperTestsBmg, WhenAskingForDcFlushThenReturnFalse) {
4444
setUpImpl();
4545
EXPECT_FALSE(MemorySynchronizationCommands<FamilyType>::getDcFlushEnable(true, pDevice->getRootDeviceEnvironment()));
4646
}
47+
48+
BMGTEST_F(GfxCoreHelperTestsBmg, givenGetDeviceTimestampWidthCalledThenReturnCorrectValue) {
49+
setUpImpl();
50+
DebugManagerStateRestore restore;
51+
52+
auto &helper = this->pDevice->getGfxCoreHelper();
53+
EXPECT_EQ(64u, helper.getDeviceTimestampWidth());
54+
55+
debugManager.flags.OverrideTimestampWidth.set(36);
56+
EXPECT_EQ(36u, helper.getDeviceTimestampWidth());
57+
}

shared/test/unit_test/xe2_hpg_core/excludes_xe2_hpg_core.cpp

+1
Original file line numberDiff line numberDiff line change
@@ -37,3 +37,4 @@ HWTEST_EXCLUDE_PRODUCT(ProductHelperTest, givenBooleanUncachedWhenCallOverridePa
3737
HWTEST_EXCLUDE_PRODUCT(GfxCoreHelperTest, whenEncodeAdditionalTimestampOffsetsThenNothingEncoded, IGFX_XE2_HPG_CORE);
3838
HWTEST_EXCLUDE_PRODUCT(ProductHelperTest, givenProductHelperWhenGetThreadEuRatioForScratchThen8IsReturned, IGFX_XE2_HPG_CORE);
3939
HWTEST_EXCLUDE_PRODUCT(CompilerProductHelperFixture, WhenIsMidThreadPreemptionIsSupportedIsCalledThenCorrectResultIsReturned, IGFX_XE2_HPG_CORE);
40+
HWTEST_EXCLUDE_PRODUCT(GfxCoreHelperTest, givenGetDeviceTimestampWidthCalledThenReturnCorrectValue, IGFX_XE2_HPG_CORE);

shared/test/unit_test/xe2_hpg_core/lnl/gfx_core_helper_tests_lnl.cpp

+11
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,7 @@
99
#include "shared/source/os_interface/product_helper.h"
1010
#include "shared/source/xe2_hpg_core/hw_cmds_lnl.h"
1111
#include "shared/source/xe2_hpg_core/hw_info_lnl.h"
12+
#include "shared/test/common/helpers/debug_manager_state_restore.h"
1213
#include "shared/test/common/helpers/default_hw_info.h"
1314
#include "shared/test/common/helpers/gfx_core_helper_tests.h"
1415
#include "shared/test/common/mocks/mock_device.h"
@@ -31,3 +32,13 @@ LNLTEST_F(GfxCoreHelperTestsLnl, givenCommandBufferAllocationTypeWhenGetAllocati
3132
LNLTEST_F(GfxCoreHelperTestsLnl, WhenAskingForDcFlushThenReturnTrue) {
3233
EXPECT_NE(MemorySynchronizationCommands<FamilyType>::getDcFlushEnable(true, this->pDevice->getRootDeviceEnvironment()), this->pDevice->getRootDeviceEnvironment().getProductHelper().isDcFlushMitigated());
3334
}
35+
36+
LNLTEST_F(GfxCoreHelperTestsLnl, givenGetDeviceTimestampWidthCalledThenReturnCorrectValue) {
37+
DebugManagerStateRestore restore;
38+
39+
auto &helper = this->pDevice->getGfxCoreHelper();
40+
EXPECT_EQ(64u, helper.getDeviceTimestampWidth());
41+
42+
debugManager.flags.OverrideTimestampWidth.set(36);
43+
EXPECT_EQ(36u, helper.getDeviceTimestampWidth());
44+
}

0 commit comments

Comments
 (0)