Skip to content

Commit e1c7124

Browse files
authored
Fix driver sorting given driver failures and instrumentation (#288)
* Fix driver sorting given driver failures and instrumentation - To avoid issues when sorting of the drivers can cause an invalid call during instrumentation after driver failures, then the driver sorting has been moved to occur during the call to zeDriverGet or zeinitDrivers. - In addition, the driver type is not init to UINT32_MAX in the enum such that all failing drivers are forced to the back of the sorted list. Signed-off-by: Neil R. Spruit <[email protected]> * Create recursion guard and check for sorting only once Signed-off-by: Neil R. Spruit <[email protected]> * Disable sorting given program instrumentation is enabled Signed-off-by: Neil R. Spruit <[email protected]> * Updated documentation on limitations of the sorting support Signed-off-by: Neil R. Spruit <[email protected]> * Sort all drivers regardless of the flags set by the user to ensure sorting once Signed-off-by: Neil R. Spruit <[email protected]> * Update loader internal header template with changes Signed-off-by: Neil R. Spruit <[email protected]> --------- Signed-off-by: Neil R. Spruit <[email protected]>
1 parent 928a993 commit e1c7124

10 files changed

+209
-141
lines changed

CHANGELOG.md

+2
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,7 @@
11
# Level zero loader changelog
22

3+
## v1.21.2
4+
* Fix driver sorting given driver failures and instrumentation
35
## v1.21.1
46
* Fix stype assignment in zello_world
57
* Given static Loader, allocate lib context_t always as dynamic and enable delayed destroy of context

CMakeLists.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@ if(MSVC AND (MSVC_VERSION LESS 1900))
1313
endif()
1414

1515
# This project follows semantic versioning (https://semver.org/)
16-
project(level-zero VERSION 1.21.1)
16+
project(level-zero VERSION 1.21.2)
1717

1818
include(GNUInstallDirs)
1919

README.md

+1
Original file line numberDiff line numberDiff line change
@@ -109,6 +109,7 @@ The ordering of the drivers reported to the user is based on the order of the en
109109
When additional driver types are added, they should be added to the end of the list to avoid reporting new device types
110110
before known device types.
111111

112+
NOTE: Due to known issues with Program Instrumentation usecases, when ZET_ENABLE_PROGRAM_INSTRUMENTATION is enabled, driver sorting is not possible in the loader.
112113

113114
# Contributing
114115

scripts/templates/ldrddi.cpp.mako

+19
Original file line numberDiff line numberDiff line change
@@ -59,6 +59,25 @@ namespace loader
5959
%elif re.match(r"\w+DriverGet$", th.make_func_name(n, tags, obj)) or re.match(r"\w+InitDrivers$", th.make_func_name(n, tags, obj)):
6060
uint32_t total_driver_handle_count = 0;
6161

62+
if (!loader::context->sortingInProgress.exchange(true) && !loader::context->instrumentationEnabled) {
63+
%if namespace != "zes":
64+
%if not re.match(r"\w+InitDrivers$", th.make_func_name(n, tags, obj)):
65+
std::call_once(loader::context->coreDriverSortOnce, []() {
66+
loader::context->driverSorting(&loader::context->zeDrivers, nullptr);
67+
});
68+
%else:
69+
std::call_once(loader::context->coreDriverSortOnce, [desc]() {
70+
loader::context->driverSorting(&loader::context->zeDrivers, desc);
71+
});
72+
%endif
73+
%else:
74+
std::call_once(loader::context->sysmanDriverSortOnce, []() {
75+
loader::context->driverSorting(loader::context->sysmanInstanceDrivers, nullptr);
76+
});
77+
%endif
78+
loader::context->sortingInProgress.store(false);
79+
}
80+
6281
%if namespace != "zes":
6382
for( auto& drv : loader::context->zeDrivers )
6483
%else:

scripts/templates/ze_loader_internal.h.mako

+6-1
Original file line numberDiff line numberDiff line change
@@ -61,7 +61,7 @@ namespace loader
6161
dditable_t dditable = {};
6262
std::string name;
6363
bool driverInuse = false;
64-
zel_driver_type_t driverType;
64+
zel_driver_type_t driverType = ZEL_DRIVER_TYPE_FORCE_UINT32;
6565
ze_driver_properties_t properties;
6666
bool pciOrderingRequested = false;
6767
};
@@ -111,10 +111,15 @@ namespace loader
111111
ze_result_t init();
112112
ze_result_t init_driver(driver_t &driver, ze_init_flags_t flags, ze_init_driver_type_desc_t* desc, ze_global_dditable_t *globalInitStored, zes_global_dditable_t *sysmanGlobalInitStored, bool sysmanOnly);
113113
void add_loader_version();
114+
bool driverSorting(driver_vector_t *drivers, ze_init_driver_type_desc_t* desc);
114115
~context_t();
115116
bool intercept_enabled = false;
116117
bool debugTraceEnabled = false;
117118
bool tracingLayerEnabled = false;
119+
std::once_flag coreDriverSortOnce;
120+
std::once_flag sysmanDriverSortOnce;
121+
std::atomic<bool> sortingInProgress = {false};
122+
bool instrumentationEnabled = false;
118123
dditable_t tracing_dditable = {};
119124
std::shared_ptr<Logger> zel_logger;
120125
};

source/drivers/null/ze_null.cpp

+5
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,7 @@
88
*
99
*/
1010
#include "ze_null.h"
11+
#include <cstring>
1112

1213
namespace driver
1314
{
@@ -138,6 +139,10 @@ namespace driver
138139
ze_device_properties_t deviceProperties = {};
139140
deviceProperties.stype = ZE_STRUCTURE_TYPE_DEVICE_PROPERTIES;
140141
deviceProperties.type = ZE_DEVICE_TYPE_GPU;
142+
auto driver_type = getenv_string( "ZEL_TEST_NULL_DRIVER_TYPE" );
143+
if (std::strcmp(driver_type.c_str(), "NPU") == 0) {
144+
deviceProperties.type = ZE_DEVICE_TYPE_VPU;
145+
}
141146
#if defined(_WIN32)
142147
strcpy_s( deviceProperties.name, "Null Device" );
143148
#else

source/loader/ze_ldrddi.cpp

+14
Original file line numberDiff line numberDiff line change
@@ -55,6 +55,13 @@ namespace loader
5555

5656
uint32_t total_driver_handle_count = 0;
5757

58+
if (!loader::context->sortingInProgress.exchange(true) && !loader::context->instrumentationEnabled) {
59+
std::call_once(loader::context->coreDriverSortOnce, []() {
60+
loader::context->driverSorting(&loader::context->zeDrivers, nullptr);
61+
});
62+
loader::context->sortingInProgress.store(false);
63+
}
64+
5865
for( auto& drv : loader::context->zeDrivers )
5966
{
6067
if(drv.initStatus != ZE_RESULT_SUCCESS)
@@ -131,6 +138,13 @@ namespace loader
131138

132139
uint32_t total_driver_handle_count = 0;
133140

141+
if (!loader::context->sortingInProgress.exchange(true) && !loader::context->instrumentationEnabled) {
142+
std::call_once(loader::context->coreDriverSortOnce, [desc]() {
143+
loader::context->driverSorting(&loader::context->zeDrivers, desc);
144+
});
145+
loader::context->sortingInProgress.store(false);
146+
}
147+
134148
for( auto& drv : loader::context->zeDrivers )
135149
{
136150
if (!drv.dditable.ze.Global.pfnInitDrivers) {

0 commit comments

Comments
 (0)