From 4dab89db681ed462a4f0a2de61f52516d1fec724 Mon Sep 17 00:00:00 2001 From: Gail Lyons Date: Tue, 30 Jun 2020 12:53:32 -0700 Subject: [PATCH 1/9] [SYCL] Changed sycl::backend::level0 to sycl::backend::level_zero Signed-off-by: Gail Lyons --- sycl/include/CL/sycl/backend_types.hpp | 4 ++-- sycl/source/detail/config.hpp | 6 +++--- sycl/source/detail/pi.cpp | 2 +- sycl/source/detail/program_manager/program_manager.cpp | 2 +- sycl/test/basic_tests/get_backend.cpp | 3 +-- sycl/unittests/pi/BackendString.hpp | 2 +- 6 files changed, 9 insertions(+), 10 deletions(-) diff --git a/sycl/include/CL/sycl/backend_types.hpp b/sycl/include/CL/sycl/backend_types.hpp index 362c6d9d9b5b9..655bbf89d8d39 100644 --- a/sycl/include/CL/sycl/backend_types.hpp +++ b/sycl/include/CL/sycl/backend_types.hpp @@ -18,7 +18,7 @@ __SYCL_INLINE_NAMESPACE(cl) { namespace sycl { -enum class backend : char { host, opencl, level0, cuda }; +enum class backend : char { host, opencl, level_zero, cuda }; template struct interop; @@ -30,7 +30,7 @@ inline std::ostream &operator<<(std::ostream &Out, backend be) { case backend::opencl: Out << std::string("opencl"); break; - case backend::level0: + case backend::level_zero: Out << std::string("level-zero"); break; case backend::cuda: diff --git a/sycl/source/detail/config.hpp b/sycl/source/detail/config.hpp index 1559f40e5ad86..f19816e8995e4 100644 --- a/sycl/source/detail/config.hpp +++ b/sycl/source/detail/config.hpp @@ -120,7 +120,7 @@ template <> class SYCLConfig { const char *ValStr = BaseT::getRawValue(); const std::array, 3> SyclBeMap = { {{"PI_OPENCL", backend::opencl}, - {"PI_LEVEL0", backend::level0}, + {"PI_LEVEL0", backend::level_zero}, {"PI_CUDA", backend::cuda}}}; if (ValStr) { auto It = std::find_if( @@ -161,6 +161,6 @@ template <> class SYCLConfig { } }; -} // __SYCL_INLINE_NAMESPACE(cl) -} // namespace sycl } // namespace detail +} // namespace sycl +} // __SYCL_INLINE_NAMESPACE(cl) diff --git a/sycl/source/detail/pi.cpp b/sycl/source/detail/pi.cpp index b00844cf85a59..786f61416d2e0 100644 --- a/sycl/source/detail/pi.cpp +++ b/sycl/source/detail/pi.cpp @@ -215,7 +215,7 @@ bool findPlugins(vector_class> &PluginNames) { // env only. // PluginNames.emplace_back(OPENCL_PLUGIN_NAME, backend::opencl); - PluginNames.emplace_back(LEVEL0_PLUGIN_NAME, backend::level0); + PluginNames.emplace_back(LEVEL0_PLUGIN_NAME, backend::level_zero); PluginNames.emplace_back(CUDA_PLUGIN_NAME, backend::cuda); return true; } diff --git a/sycl/source/detail/program_manager/program_manager.cpp b/sycl/source/detail/program_manager/program_manager.cpp index 1d788a9bbc1fb..77a7153ce0af2 100644 --- a/sycl/source/detail/program_manager/program_manager.cpp +++ b/sycl/source/detail/program_manager/program_manager.cpp @@ -766,7 +766,7 @@ ProgramManager::build(ProgramPtr Program, const ContextImplPtr Context, // is built during piProgramCreate. // TODO: remove this check as soon as piProgramCompile/piProgramLink will be // implemented in L0 plugin. - if (Context->getPlugin().getBackend() == backend::level0) { + if (Context->getPlugin().getBackend() == backend::level_zero) { LinkDeviceLibs = false; } diff --git a/sycl/test/basic_tests/get_backend.cpp b/sycl/test/basic_tests/get_backend.cpp index de0738dd88341..a312304e0741b 100644 --- a/sycl/test/basic_tests/get_backend.cpp +++ b/sycl/test/basic_tests/get_backend.cpp @@ -3,7 +3,6 @@ // //==----------------- get_backend.cpp ------------------------==// // This is a test of get_backend(). -// Also prints handy info about the system. // Do not set SYCL_BE. We do not want the preferred backend. //==----------------------------------------------------------==// @@ -16,7 +15,7 @@ using namespace cl::sycl; bool check(backend be) { switch (be) { case backend::opencl: - case backend::level0: + case backend::level_zero: case backend::cuda: case backend::host: return true; diff --git a/sycl/unittests/pi/BackendString.hpp b/sycl/unittests/pi/BackendString.hpp index cea0eee8b8338..7f051f5ab6790 100644 --- a/sycl/unittests/pi/BackendString.hpp +++ b/sycl/unittests/pi/BackendString.hpp @@ -15,7 +15,7 @@ inline const char *GetBackendString(cl::sycl::backend backend) { PI_BACKEND_STR(cuda); PI_BACKEND_STR(host); PI_BACKEND_STR(opencl); - PI_BACKEND_STR(level0); + PI_BACKEND_STR(level_zero); #undef PI_BACKEND_STR default: return "Unknown Plugin"; From 9bf0ce17d72635fa02177d3a0563c5ea1050200c Mon Sep 17 00:00:00 2001 From: Gail Lyons Date: Mon, 13 Jul 2020 12:02:09 -0700 Subject: [PATCH 2/9] Changed level0 -> level_zero. SYCL_BE PI_LEVEL0 is now PI_LEVEL_ZERO. PI_LEVEL0 is still accepted and handled correctly. cl::sycl::backend::level0 is now cl::sycl::backend::level_zero. Signed-off-by: Gail Lyons --- sycl/CMakeLists.txt | 2 +- sycl/doc/EnvironmentVariables.md | 4 +- sycl/include/CL/sycl/detail/pi.hpp | 4 +- sycl/plugins/level_zero/CMakeLists.txt | 30 ++--- .../{pi_level0.cpp => pi_level_zero.cpp} | 124 +++++++++--------- .../{pi_level0.hpp => pi_level_zero.hpp} | 52 ++++---- sycl/source/detail/config.hpp | 9 +- sycl/source/detail/pi.cpp | 2 +- .../program_manager/program_manager.cpp | 4 +- sycl/test/CMakeLists.txt | 6 +- ...k.dump => pi_level_zero_symbol_check.dump} | 3 +- sycl/test/basic_tests/buffer/reinterpret.cpp | 2 +- .../image_accessor_readsampler.cpp | 2 +- .../basic_tests/image_accessor_readwrite.cpp | 2 +- .../image_accessor_readwrite_half.cpp | 2 +- sycl/test/basic_tests/kernel_info.cpp | 4 +- .../basic_tests/parallel_for_indexers.cpp | 2 +- sycl/test/basic_tests/parallel_for_range.cpp | 2 +- .../host-task-dependency.cpp | 2 +- .../host-task-two-queues.cpp | 2 +- sycl/test/host-interop-task/interop-task.cpp | 2 +- sycl/test/lit.cfg.py | 16 +-- sycl/test/regression/fsycl-save-temps.cpp | 4 +- sycl/test/regression/image_access.cpp | 4 +- sycl/test/regression/static-buffer-dtor.cpp | 2 +- sycl/test/spec_const/spec_const_hw.cpp | 2 +- sycl/test/spec_const/spec_const_neg.cpp | 2 +- sycl/test/spec_const/spec_const_redefine.cpp | 2 +- sycl/test/usm/allocator_vector.cpp | 2 +- sycl/tools/get_device_count_by_type.cpp | 4 +- 30 files changed, 152 insertions(+), 148 deletions(-) rename sycl/plugins/level_zero/{pi_level0.cpp => pi_level_zero.cpp} (97%) rename sycl/plugins/level_zero/{pi_level0.hpp => pi_level_zero.hpp} (89%) rename sycl/test/abi/{pi_level0_symbol_check.dump => pi_level_zero_symbol_check.dump} (98%) diff --git a/sycl/CMakeLists.txt b/sycl/CMakeLists.txt index c87834185879d..db0b2248e42ce 100644 --- a/sycl/CMakeLists.txt +++ b/sycl/CMakeLists.txt @@ -352,7 +352,7 @@ set( SYCL_TOOLCHAIN_DEPLOY_COMPONENTS sycl-headers-extras sycl pi_opencl - pi_level0 + pi_level_zero libsycldevice ) if(OpenCL_INSTALL_KHRONOS_ICD_LOADER AND TARGET ocl-icd) diff --git a/sycl/doc/EnvironmentVariables.md b/sycl/doc/EnvironmentVariables.md index 3d8d5cb41f741..b353135ecb9db 100644 --- a/sycl/doc/EnvironmentVariables.md +++ b/sycl/doc/EnvironmentVariables.md @@ -1,6 +1,6 @@ # Environment Variables -This document describes environment variables that are having effect on DPC++ +This document describes environment variables that are having effect on DPC++ compiler and runtime. ## Controlling DPC++ RT @@ -12,7 +12,7 @@ subject to change. Do not rely on these variables in production code. | Environment variable | Values | Description | | -------------------- | ------ | ----------- | | SYCL_PI_TRACE | Described [below](#sycl_pi_trace-options) | Enable specified level of tracing for PI. | -| SYCL_BE | PI_OPENCL, PI_LEVEL0, PI_CUDA | Force SYCL RT to consider only devices of the specified backend during the device selection. | +| SYCL_BE | PI_OPENCL, PI_LEVEL_ZERO, PI_CUDA | Force SYCL RT to consider only devices of the specified backend during the device selection. | | SYCL_DEVICE_TYPE | One of: CPU, GPU, ACC, HOST | Force SYCL to use the specified device type. If unset, default selection rules are applied. If set to any unlisted value, this control has no effect. If the requested device type is not found, a `cl::sycl::runtime_error` exception is thrown. If a non-default device selector is used, a device must satisfy both the selector and this control to be chosen. This control only has effect on devices created with a selector. | | SYCL_PROGRAM_COMPILE_OPTIONS | String of valid OpenCL compile options | Override compile options for all programs. | | SYCL_PROGRAM_LINK_OPTIONS | String of valid OpenCL link options | Override link options for all programs. | diff --git a/sycl/include/CL/sycl/detail/pi.hpp b/sycl/include/CL/sycl/detail/pi.hpp index 5ff6e6312df36..8702bc3a8be11 100644 --- a/sycl/include/CL/sycl/detail/pi.hpp +++ b/sycl/include/CL/sycl/detail/pi.hpp @@ -57,11 +57,11 @@ bool trace(TraceLevel level); #ifdef SYCL_RT_OS_WINDOWS #define OPENCL_PLUGIN_NAME "pi_opencl.dll" -#define LEVEL0_PLUGIN_NAME "pi_level0.dll" +#define LEVEL_ZERO_PLUGIN_NAME "pi_level_zero.dll" #define CUDA_PLUGIN_NAME "pi_cuda.dll" #else #define OPENCL_PLUGIN_NAME "libpi_opencl.so" -#define LEVEL0_PLUGIN_NAME "libpi_level0.so" +#define LEVEL_ZERO_PLUGIN_NAME "libpi_level_zero.so" #define CUDA_PLUGIN_NAME "libpi_cuda.so" #endif diff --git a/sycl/plugins/level_zero/CMakeLists.txt b/sycl/plugins/level_zero/CMakeLists.txt index bc75ae3ecee9c..dd7b7efffb1f3 100755 --- a/sycl/plugins/level_zero/CMakeLists.txt +++ b/sycl/plugins/level_zero/CMakeLists.txt @@ -1,4 +1,4 @@ -# PI Level0 plugin library +# PI Level Zero plugin library if(MSVC) set(L0_LOADER @@ -66,20 +66,20 @@ target_include_directories(L0Loader-Headers include_directories("${sycl_inc_dir}") include_directories(${OPENCL_INCLUDE}) -add_library(pi_level0 SHARED +add_library(pi_level_zero SHARED "${sycl_inc_dir}/CL/sycl/detail/pi.h" - "${CMAKE_CURRENT_SOURCE_DIR}/pi_level0.cpp" - "${CMAKE_CURRENT_SOURCE_DIR}/pi_level0.hpp" + "${CMAKE_CURRENT_SOURCE_DIR}/pi_level_zero.cpp" + "${CMAKE_CURRENT_SOURCE_DIR}/pi_level_zero.hpp" ) if (MSVC) # by defining __SYCL_BUILD_SYCL_DLL, we can use __declspec(dllexport) # which are individually tagged for all pi* symbols in pi.h - target_compile_definitions(pi_level0 PRIVATE __SYCL_BUILD_SYCL_DLL) + target_compile_definitions(pi_level_zero PRIVATE __SYCL_BUILD_SYCL_DLL) else() # we set the visibility of all symbols 'hidden' by default. # In pi.h file, we set exported symbols with visibility==default individually - target_compile_options(pi_level0 PUBLIC -fvisibility=hidden) + target_compile_options(pi_level_zero PUBLIC -fvisibility=hidden) # This script file is used to allow exporting pi* symbols only. # All other symbols are regarded as local (hidden) @@ -87,23 +87,23 @@ else() # Filter symbols based on the scope defined in the script file, # and export pi* function symbols in the library. - target_link_libraries( pi_level0 + target_link_libraries( pi_level_zero PRIVATE "-Wl,--version-script=${linker_script}" ) endif() if (TARGET l0-loader) - add_dependencies(pi_level0 l0-loader) + add_dependencies(pi_level_zero l0-loader) endif() - add_dependencies(sycl-toolchain pi_level0) + add_dependencies(sycl-toolchain pi_level_zero) - target_link_libraries(pi_level0 PRIVATE "${L0_LOADER}") + target_link_libraries(pi_level_zero PRIVATE "${L0_LOADER}") if (UNIX) - target_link_libraries(pi_level0 PRIVATE pthread) + target_link_libraries(pi_level_zero PRIVATE pthread) endif() -add_common_options(pi_level0) +add_common_options(pi_level_zero) -install(TARGETS pi_level0 - LIBRARY DESTINATION "lib" COMPONENT pi_level0 - RUNTIME DESTINATION "bin" COMPONENT pi_level0) +install(TARGETS pi_level_zero + LIBRARY DESTINATION "lib" COMPONENT pi_level_zero + RUNTIME DESTINATION "bin" COMPONENT pi_level_zero) diff --git a/sycl/plugins/level_zero/pi_level0.cpp b/sycl/plugins/level_zero/pi_level_zero.cpp similarity index 97% rename from sycl/plugins/level_zero/pi_level0.cpp rename to sycl/plugins/level_zero/pi_level_zero.cpp index dc4ccfd988ca9..72fb03d8cd90e 100644 --- a/sycl/plugins/level_zero/pi_level0.cpp +++ b/sycl/plugins/level_zero/pi_level_zero.cpp @@ -1,4 +1,4 @@ -//===----------- pi_level0.cpp - Level Zero Plugin--------------------------==// +//===----------- pi_level_zero.cpp - Level Zero Plugin--------------------------==// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. @@ -6,12 +6,12 @@ // //===----------------------------------------------------------------------===// -/// \file pi_level0.cpp +/// \file pi_level_zero.cpp /// Implementation of Level Zero Plugin. /// -/// \ingroup sycl_pi_level0 +/// \ingroup sycl_pi_level_zero -#include "pi_level0.hpp" +#include "pi_level_zero.hpp" #include #include #include @@ -25,7 +25,7 @@ namespace { -// Controls L0 calls serialization to w/a L0 driver being not MT ready. +// Controls Level Zero calls serialization to w/a Level Zero driver being not MT ready. // Recognized values (can be used as a bit mask): enum { ZeSerializeNone = @@ -36,10 +36,10 @@ enum { }; static pi_uint32 ZeSerialize = 0; -// This class encapsulates actions taken along with a call to L0 API. +// This class encapsulates actions taken along with a call to Level Zero API. class ZeCall { private: - // The global mutex that is used for total serialization of L0 calls. + // The global mutex that is used for total serialization of Level Zero calls. static std::mutex GlobalLock; public: @@ -60,7 +60,7 @@ class ZeCall { }; std::mutex ZeCall::GlobalLock; -// Controls L0 calls tracing in zePrint. +// Controls Level Zero calls tracing in zePrint. static bool ZeDebug = false; static void zePrint(const char *Format, ...) { @@ -232,12 +232,12 @@ _pi_context::decrementAliveEventsInPool(ze_event_pool_handle_t ZePool) { return ZE_RESULT_SUCCESS; } -// Some opencl extensions we know are supported by all Level0 devices. +// Some opencl extensions we know are supported by all Level Zero devices. constexpr char ZE_SUPPORTED_EXTENSIONS[] = "cl_khr_il_program cl_khr_subgroups cl_intel_subgroups " "cl_intel_subgroups_short cl_intel_required_subgroup_size "; -// Map L0 runtime error code to PI error code +// Map Level Zero runtime error code to PI error code static pi_result mapError(ze_result_t ZeResult) { // TODO: these mapping need to be clarified and synced with the PI API return // values, which is TBD. @@ -369,7 +369,7 @@ pi_result _pi_device::initialize() { // Crate a new command list to be used in a PI call pi_result _pi_device::createCommandList(ze_command_list_handle_t *ZeCommandList) { - // Create the command list, because in L0 commands are added to + // Create the command list, because in Level Zero commands are added to // the command lists, and later are then added to the command queue. // // TODO: Figure out how to lower the overhead of creating a new list @@ -444,7 +444,7 @@ pi_result piPlatformsGet(pi_uint32 NumEntries, pi_platform *Platforms, return PI_INVALID_VALUE; } - // This is a good time to initialize L0. + // This is a good time to initialize Level Zero. // TODO: We can still safely recover if something goes wrong during the init. // Implement handling segfault using sigaction. // TODO: We should not call zeInit multiples times ever, so @@ -463,7 +463,7 @@ pi_result piPlatformsGet(pi_uint32 NumEntries, pi_platform *Platforms, return mapError(ZeResult); } - // L0 does not have concept of Platforms, but L0 driver is the + // Level Zero does not have concept of Platforms, but Level Zero driver is the // closest match. if (Platforms && NumEntries > 0) { uint32_t ZeDriverCount = 0; @@ -529,10 +529,10 @@ pi_result piPlatformGetInfo(pi_platform Platform, pi_platform_info ParamName, switch (ParamName) { case PI_PLATFORM_INFO_NAME: - // TODO: Query L0 driver when relevant info is added there. + // TODO: Query Level Zero driver when relevant info is added there. return ReturnValue("Intel(R) Level-Zero"); case PI_PLATFORM_INFO_VENDOR: - // TODO: Query L0 driver when relevant info is added there. + // TODO: Query Level Zero driver when relevant info is added there. return ReturnValue("Intel(R) Corporation"); case PI_PLATFORM_INFO_EXTENSIONS: // Convention adopted from OpenCL: @@ -543,7 +543,7 @@ pi_result piPlatformGetInfo(pi_platform Platform, pi_platform_info ParamName, // // TODO: Check the common extensions supported by all connected devices and // return them. For now, hardcoding some extensions we know are supported by - // all Level0 devices. + // all Level Zero devices. return ReturnValue(ZE_SUPPORTED_EXTENSIONS); case PI_PLATFORM_INFO_PROFILE: // TODO: figure out what this means and how is this used @@ -571,7 +571,7 @@ pi_result piextPlatformGetNativeHandle(pi_platform Platform, assert(NativeHandle); auto ZeDriver = pi_cast(NativeHandle); - // Extract the L0 driver handle from the given PI platform + // Extract the Level Zero driver handle from the given PI platform *ZeDriver = Platform->ZeDriver; return PI_SUCCESS; } @@ -581,7 +581,7 @@ pi_result piextPlatformCreateWithNativeHandle(pi_native_handle NativeHandle, assert(NativeHandle); assert(Platform); - // Create PI platform from the given L0 driver handle. + // Create PI platform from the given Level Zero driver handle. auto ZeDriver = pi_cast(NativeHandle); *Platform = new _pi_platform(ZeDriver); return PI_SUCCESS; @@ -594,7 +594,7 @@ pi_result piDevicesGet(pi_platform Platform, pi_device_type DeviceType, assert(Platform); ze_driver_handle_t ZeDriver = Platform->ZeDriver; - // Get number of devices supporting L0 + // Get number of devices supporting Level Zero uint32_t ZeDeviceCount = 0; const bool AskingForGPU = (DeviceType & PI_DEVICE_TYPE_GPU); const bool AskingForDefault = (DeviceType == PI_DEVICE_TYPE_DEFAULT); @@ -710,7 +710,7 @@ pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, return ReturnValue(PI_DEVICE_TYPE_GPU); } case PI_DEVICE_INFO_PARENT_DEVICE: - // TODO: all L0 devices are parent ? + // TODO: all Level Zero devices are parent ? return ReturnValue(pi_device{0}); case PI_DEVICE_INFO_PLATFORM: return ReturnValue(Device->Platform); @@ -721,8 +721,8 @@ pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, // "Returns a space separated list of extension names (the extension // names themselves do not contain any spaces) supported by the device." // - // TODO: Use proper mechanism to get this information from Level0 after - // it is added to Level0. + // TODO: Use proper mechanism to get this information from Level Zero after + // it is added to Level Zero. // Hardcoding the few we know are supported by the current hardware. // // @@ -746,7 +746,7 @@ pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, // cl_khr_3d_image_writes - Extension to enable writes to 3D image memory // objects. // - // Hardcoding some extensions we know are supported by all Level0 devices. + // Hardcoding some extensions we know are supported by all Level Zero devices. SupportedExtensions += (ZE_SUPPORTED_EXTENSIONS); if (ZeDeviceKernelProperties.fp16Supported) SupportedExtensions += ("cl_khr_fp16 "); @@ -776,7 +776,7 @@ pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, return ReturnValue(pi_uint32{MaxComputeUnits}); } case PI_DEVICE_INFO_MAX_WORK_ITEM_DIMENSIONS: - // L0 spec defines only three dimensions + // Level Zero spec defines only three dimensions return ReturnValue(pi_uint32{3}); case PI_DEVICE_INFO_MAX_WORK_GROUP_SIZE: return ReturnValue( @@ -837,7 +837,7 @@ pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, return ReturnValue(pi_uint32{Device->RefCount}); case PI_DEVICE_INFO_PARTITION_PROPERTIES: { // It is debatable if SYCL sub-device and partitioning APIs sufficient to - // expose Level0 sub-devices? We start with support of + // expose Level Zero sub-devices? We start with support of // "partition_by_affinity_domain" and "numa" but if that doesn't seem to // be a good fit we could look at adding a more descriptive partitioning // type. @@ -905,7 +905,7 @@ pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, case PI_DEVICE_INFO_MEM_BASE_ADDR_ALIGN: // SYCL/OpenCL spec is vague on what this means exactly, but seems to // be for "alignment requirement (in bits) for sub-buffer offsets." - // An OpenCL implementation returns 8*128, but L0 can do just 8, + // An OpenCL implementation returns 8*128, but Level Zero can do just 8, // meaning unaligned access for values of types larger than 8 bits. return ReturnValue(pi_uint32{8}); case PI_DEVICE_INFO_MAX_SAMPLERS: @@ -987,23 +987,23 @@ pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, return ReturnValue(pi_uint64{DoubleFPValue}); } case PI_DEVICE_INFO_IMAGE2D_MAX_WIDTH: - // Until L0 provides needed info, hardcode default minimum values required + // Until Level Zero provides needed info, hardcode default minimum values required // by the SYCL specification. return ReturnValue(size_t{8192}); case PI_DEVICE_INFO_IMAGE2D_MAX_HEIGHT: - // Until L0 provides needed info, hardcode default minimum values required + // Until Level Zero provides needed info, hardcode default minimum values required // by the SYCL specification. return ReturnValue(size_t{8192}); case PI_DEVICE_INFO_IMAGE3D_MAX_WIDTH: - // Until L0 provides needed info, hardcode default minimum values required + // Until Level Zero provides needed info, hardcode default minimum values required // by the SYCL specification. return ReturnValue(size_t{2048}); case PI_DEVICE_INFO_IMAGE3D_MAX_HEIGHT: - // Until L0 provides needed info, hardcode default minimum values required + // Until Level Zero provides needed info, hardcode default minimum values required // by the SYCL specification. return ReturnValue(size_t{2048}); case PI_DEVICE_INFO_IMAGE3D_MAX_DEPTH: - // Until L0 provides needed info, hardcode default minimum values required + // Until Level Zero provides needed info, hardcode default minimum values required // by the SYCL specification. return ReturnValue(size_t{2048}); case PI_DEVICE_INFO_IMAGE_MAX_BUFFER_SIZE: @@ -1098,7 +1098,7 @@ pi_result piDevicePartition(pi_device Device, const pi_device_partition_property *Properties, pi_uint32 NumDevices, pi_device *OutDevices, pi_uint32 *OutNumDevices) { - // Other partitioning ways are not supported by L0 + // Other partitioning ways are not supported by Level Zero if (Properties[0] != PI_DEVICE_PARTITION_BY_AFFINITY_DOMAIN || Properties[1] != PI_DEVICE_AFFINITY_DOMAIN_NEXT_PARTITIONABLE) { return PI_INVALID_VALUE; @@ -1131,7 +1131,7 @@ pi_result piDevicePartition(pi_device Device, auto ZeSubdevices = new ze_device_handle_t[Count]; ZE_CALL(zeDeviceGetSubDevices(Device->ZeDevice, &Count, ZeSubdevices)); - // Wrap the L0 sub-devices into PI sub-devices, and write them out. + // Wrap the Level Zero sub-devices into PI sub-devices, and write them out. for (uint32_t I = 0; I < Count; ++I) { OutDevices[I] = new _pi_device(ZeSubdevices[I], Device->Platform, true /* isSubDevice */); @@ -1175,14 +1175,14 @@ pi_result piextDeviceGetNativeHandle(pi_device Device, assert(NativeHandle); auto ZeDevice = pi_cast(NativeHandle); - // Extract the L0 module handle from the given PI device + // Extract the Level Zero module handle from the given PI device *ZeDevice = Device->ZeDevice; return PI_SUCCESS; } pi_result piextDeviceCreateWithNativeHandle(pi_native_handle NativeHandle, pi_device *Device) { - // Create PI device from the given L0 device handle. + // Create PI device from the given Level Zero device handle. die("piextDeviceCreateWithNativeHandle: not supported"); return PI_SUCCESS; } @@ -1194,7 +1194,7 @@ pi_result piContextCreate(const pi_context_properties *Properties, void *UserData), void *UserData, pi_context *RetContext) { - // L0 does not have notion of contexts. + // Level Zero does not have notion of contexts. // Return the device handle (only single device is allowed) as a context // handle. if (NumDevices != 1) { @@ -1413,7 +1413,7 @@ pi_result piMemBufferCreate(pi_context Context, pi_mem_flags Flags, size_t Size, (Flags & PI_MEM_FLAGS_HOST_PTR_USE) ? pi_cast(HostPtr) : nullptr; try { *RetMem = new _pi_buffer(Context->Device->Platform, - pi_cast(Ptr) /* L0 Memory Handle */, + pi_cast(Ptr) /* Level Zero Memory Handle */, HostPtrOrNull); } catch (const std::bad_alloc &) { return PI_OUT_OF_HOST_MEMORY; @@ -1708,7 +1708,7 @@ pi_result piclProgramCreateWithSource(pi_context Context, pi_uint32 Count, const size_t *Lengths, pi_program *RetProgram) { - zePrint("piclProgramCreateWithSource: not supported in L0\n"); + zePrint("piclProgramCreateWithSource: not supported in Level Zero\n"); return PI_INVALID_OPERATION; } @@ -1722,7 +1722,7 @@ pi_result piProgramGetInfo(pi_program Program, pi_program_info ParamName, case PI_PROGRAM_INFO_REFERENCE_COUNT: return ReturnValue(pi_uint32{Program->RefCount}); case PI_PROGRAM_INFO_NUM_DEVICES: - // L0 Module is always for a single device. + // Level Zero Module is always for a single device. return ReturnValue(pi_uint32{1}); case PI_PROGRAM_INFO_DEVICES: return ReturnValue(Program->Context->Device); @@ -1746,7 +1746,7 @@ pi_result piProgramGetInfo(pi_program Program, pi_program_info ParamName, case PI_PROGRAM_INFO_KERNEL_NAMES: try { // There are extra allocations/copying here dictated by the difference - // in L0 and PI interfaces. + // in Level Zero and PI interfaces. uint32_t Count = 0; ZE_CALL(zeModuleGetKernelNames(Program->ZeModule, &Count, nullptr)); char **PNames = new char *[Count]; @@ -1777,13 +1777,13 @@ pi_result piProgramLink(pi_context Context, pi_uint32 NumDevices, const pi_program *InputPrograms, void (*PFnNotify)(pi_program Program, void *UserData), void *UserData, pi_program *RetProgram) { - die("piProgramLink: Program Linking is not supported yet in Level0"); + die("piProgramLink: Program Linking is not supported yet in Level Zero"); - // TODO: L0 builds the program at the time of piProgramCreate. + // TODO: Level Zero builds the program at the time of piProgramCreate. // But build options are not available at that time, so we must // stop building it there, but move it here. The problem though // is that this would mean moving zeModuleCreate here entirely, - // and so L0 module creation would be deferred until + // and so Level Zero module creation would be deferred until // piProgramCompile/piProgramLink/piProgramBuild. assert(NumInputPrograms == 1 && InputPrograms); assert(RetProgram); @@ -1797,11 +1797,11 @@ pi_result piProgramCompile( const pi_program *InputHeaders, const char **HeaderIncludeNames, void (*PFnNotify)(pi_program Program, void *UserData), void *UserData) { - // TODO: L0 builds the program at the time of piProgramCreate. + // TODO: Level Zero builds the program at the time of piProgramCreate. // But build options are not available at that time, so we must // stop building it there, but move it here. The problem though // is that this would mean moving zeModuleCreate here entirely, - // and so L0 module creation would be deferred until + // and so Level Zero module creation would be deferred until // piProgramCompile/piProgramLink/piProgramBuild. // // It is expected that program was successfully built during piProgramCreate @@ -1814,11 +1814,11 @@ pi_result piProgramBuild(pi_program Program, pi_uint32 NumDevices, void (*PFnNotify)(pi_program Program, void *UserData), void *UserData) { - // TODO: L0 builds the program at the time of piProgramCreate. + // TODO: Level Zero builds the program at the time of piProgramCreate. // But build options are not available at that time, so we must // stop building it there, but move it here. The problem though // is that this would mean moving zeModuleCreate here entirely, - // and so L0 module creation would be deferred until + // and so Level Zero module creation would be deferred until // piProgramCompile/piProgramLink/piProgramBuild. // // It is expected that program was successfully built during piProgramCreate @@ -1833,14 +1833,14 @@ pi_result piProgramGetBuildInfo(pi_program Program, pi_device Device, ReturnHelper ReturnValue(ParamValueSize, ParamValue, ParamValueSizeRet); if (ParamName == CL_PROGRAM_BINARY_TYPE) { - // TODO: is this the only supported binary type in L0? + // TODO: is this the only supported binary type in Level Zero? // We should probably return CL_PROGRAM_BINARY_TYPE_NONE if asked // before the program was compiled. return ReturnValue( cl_program_binary_type{CL_PROGRAM_BINARY_TYPE_EXECUTABLE}); } if (ParamName == CL_PROGRAM_BUILD_OPTIONS) { - // TODO: how to get module build options out of L0? + // TODO: how to get module build options out of Level Zero? // For the programs that we compiled we can remember the options // passed with piProgramCompile/piProgramBuild, but what can we // return for programs that were built outside and registered @@ -1861,7 +1861,7 @@ pi_result piProgramRelease(pi_program Program) { assert(Program); assert((Program->RefCount > 0) && "Program is already released."); if (--(Program->RefCount) == 0) { - // TODO: call zeModuleDestroy for non-interop L0 modules + // TODO: call zeModuleDestroy for non-interop Level Zero modules delete Program; } return PI_SUCCESS; @@ -2280,7 +2280,7 @@ pi_result piEventGetProfilingInfo(pi_event Event, pi_profiling_info ParamName, } case PI_PROFILING_INFO_COMMAND_QUEUED: case PI_PROFILING_INFO_COMMAND_SUBMIT: - // TODO: Support these when L0 supported is added. + // TODO: Support these when Level Zero supported is added. return ReturnValue(uint64_t{0}); default: zePrint("piEventGetProfilingInfo: not supported ParamName\n"); @@ -2923,7 +2923,7 @@ piEnqueueMemBufferMap(pi_queue Queue, pi_mem Buffer, pi_bool BlockingMap, ZE_CALL(zeCommandListAppendWaitOnEvents(ZeCommandList, NumEventsInWaitList, ZeEventWaitList)); - // TODO: L0 is missing the memory "mapping" capabilities, so we are left + // TODO: Level Zero is missing the memory "mapping" capabilities, so we are left // to doing new memory allocation and a copy (read). // // TODO: check if the input buffer is already allocated in shared @@ -2994,7 +2994,7 @@ pi_result piEnqueueMemUnmap(pi_queue Queue, pi_mem MemObj, void *MappedPtr, ZE_CALL(zeCommandListAppendWaitOnEvents(ZeCommandList, NumEventsInWaitList, ZeEventWaitList)); - // TODO: L0 is missing the memory "mapping" capabilities, so we are left + // TODO: Level Zero is missing the memory "mapping" capabilities, so we are left // to doing copy (write back to the device). // // NOTE: Keep this in sync with the implementation of @@ -3111,7 +3111,7 @@ enqueueMemImageCommandHelper(pi_command_type CommandType, pi_queue Queue, const ze_image_region_t ZeSrcRegion = getImageRegionHelper(SrcMem, SrcOrigin, Region); - // TODO: L0 does not support row_pitch/slice_pitch for images yet. + // TODO: Level Zero does not support row_pitch/slice_pitch for images yet. // Check that SYCL RT did not want pitch larger than default. #ifndef NDEBUG assert(SrcMem->isImage()); @@ -3136,7 +3136,7 @@ enqueueMemImageCommandHelper(pi_command_type CommandType, pi_queue Queue, const ze_image_region_t ZeDstRegion = getImageRegionHelper(DstMem, DstOrigin, Region); - // TODO: L0 does not support row_pitch/slice_pitch for images yet. + // TODO: Level Zero does not support row_pitch/slice_pitch for images yet. // Check that SYCL RT did not want pitch larger than default. #ifndef NDEBUG assert(DstMem->isImage()); @@ -3267,7 +3267,7 @@ pi_result piMemBufferPartition(pi_mem Buffer, pi_mem_flags Flags, *RetMem = new _pi_buffer(Buffer->Platform, pi_cast(Buffer->getZeHandle()) + - Region->origin /* L0 memory handle */, + Region->origin /* Level Zero memory handle */, nullptr /* Host pointer */, Buffer /* Parent buffer */, Region->origin /* Sub-buffer origin */, Region->size /*Sub-buffer size*/); @@ -3313,7 +3313,7 @@ pi_result piextUSMHostAlloc(void **ResultPtr, pi_context Context, ze_host_mem_alloc_desc_t ZeDesc = {}; ZeDesc.flags = ZE_HOST_MEM_ALLOC_FLAG_DEFAULT; - // TODO: translate PI properties to L0 flags + // TODO: translate PI properties to Level Zero flags ZE_CALL(zeDriverAllocHostMem(Context->Device->Platform->ZeDriver, &ZeDesc, Size, Alignment, ResultPtr)); @@ -3330,7 +3330,7 @@ pi_result piextUSMDeviceAlloc(void **ResultPtr, pi_context Context, // Check that incorrect bits are not set in the properties. assert(!Properties || (Properties && !(*Properties & ~PI_MEM_ALLOC_FLAGS))); - // TODO: translate PI properties to L0 flags + // TODO: translate PI properties to Level Zero flags ze_device_mem_alloc_desc_t ZeDesc = {}; ZeDesc.flags = ZE_DEVICE_MEM_ALLOC_FLAG_DEFAULT; ZeDesc.ordinal = 0; @@ -3350,7 +3350,7 @@ pi_result piextUSMSharedAlloc(void **ResultPtr, pi_context Context, // Check that incorrect bits are not set in the properties. assert(!Properties || (Properties && !(*Properties & ~PI_MEM_ALLOC_FLAGS))); - // TODO: translate PI properties to L0 flags + // TODO: translate PI properties to Level Zero flags ze_host_mem_alloc_desc_t ZeHostDesc = {}; ZeHostDesc.flags = ZE_HOST_MEM_ALLOC_FLAG_DEFAULT; ze_device_mem_alloc_desc_t ZeDevDesc = {}; @@ -3462,7 +3462,7 @@ pi_result piextUSMEnqueuePrefetch(pi_queue Queue, const void *Ptr, size_t Size, // TODO: figure out how to translate "flags" ZE_CALL(zeCommandListAppendMemoryPrefetch(ZeCommandList, Ptr, Size)); - // TODO: L0 does not have a completion "event" with the prefetch API, + // TODO: Level Zero does not have a completion "event" with the prefetch API, // so manually add command to signal our event. ZE_CALL(zeCommandListAppendSignalEvent(ZeCommandList, ZeEvent)); @@ -3545,7 +3545,7 @@ pi_result piextUSMEnqueueMemAdvise(pi_queue Queue, const void *Ptr, ZE_CALL(zeCommandListAppendMemAdvise( ZeCommandList, Queue->Context->Device->ZeDevice, Ptr, Length, ZeAdvice)); - // TODO: L0 does not have a completion "event" with the advise API, + // TODO: Level Zero does not have a completion "event" with the advise API, // so manually add command to signal our event. ZE_CALL(zeCommandListAppendSignalEvent(ZeCommandList, ZeEvent)); @@ -3606,7 +3606,7 @@ pi_result piextUSMGetMemAllocInfo(pi_context Context, const void *Ptr, } case PI_MEM_ALLOC_DEVICE: { // TODO: this wants pi_device, but we didn't remember it, and cannot - // deduct from the L0 device. + // deduct from the Level Zero device. die("piextUSMGetMemAllocInfo: PI_MEM_ALLOC_DEVICE not implemented"); break; } diff --git a/sycl/plugins/level_zero/pi_level0.hpp b/sycl/plugins/level_zero/pi_level_zero.hpp similarity index 89% rename from sycl/plugins/level_zero/pi_level0.hpp rename to sycl/plugins/level_zero/pi_level_zero.hpp index ad23384b56724..8a38eab1bdb43 100755 --- a/sycl/plugins/level_zero/pi_level0.hpp +++ b/sycl/plugins/level_zero/pi_level_zero.hpp @@ -1,4 +1,4 @@ -//===---------- pi_level0.hpp - Level Zero Plugin -------------------------===// +//===---------- pi_level_zero.hpp - Level Zero Plugin -------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. @@ -6,17 +6,17 @@ // //===----------------------------------------------------------------------===// -/// \defgroup sycl_pi_level0 Level Zero Plugin +/// \defgroup sycl_pi_level_zero Level Zero Plugin /// \ingroup sycl_pi -/// \file pi_level0.hpp +/// \file pi_level_zero.hpp /// Declarations for Level Zero Plugin. It is the interface between the /// device-agnostic SYCL runtime layer and underlying Level Zero runtime. /// -/// \ingroup sycl_pi_level0 +/// \ingroup sycl_pi_level_zero -#ifndef PI_LEVEL0_HPP -#define PI_LEVEL0_HPP +#ifndef PI_LEVEL_ZERO_HPP +#define PI_LEVEL_ZERO_HPP #include #include @@ -51,17 +51,17 @@ template <> uint32_t pi_cast(uint64_t Value) { struct _pi_object { _pi_object() : RefCount{1} {} - // L0 doesn't do the reference counting, so we have to do. + // Level Zero doesn't do the reference counting, so we have to do. // Must be atomic to prevent data race when incrementing/decrementing. std::atomic RefCount; }; -// Define the types that are opaque in pi.h in a manner suitabale for L0 plugin +// Define the types that are opaque in pi.h in a manner suitabale for Level Zero plugin struct _pi_platform { _pi_platform(ze_driver_handle_t Driver) : ZeDriver{Driver} {} - // L0 lacks the notion of a platform, but there is a driver, which is a + // Level Zero lacks the notion of a platform, but there is a driver, which is a // pretty good fit to keep here. ze_driver_handle_t ZeDriver; @@ -83,13 +83,13 @@ struct _pi_device : _pi_object { // Initialize the entire PI device. pi_result initialize(); - // L0 device handle. + // Level Zero device handle. ze_device_handle_t ZeDevice; // PI platform to which this device belongs. pi_platform Platform; - // Immediate L0 command list for this device, to be used for initializations. + // Immediate Level Zero command list for this device, to be used for initializations. // To be created as: // - Immediate command list: So any command appended to it is immediately // offloaded to the device. @@ -117,7 +117,7 @@ struct _pi_context : _pi_object { : Device{Device}, ZeEventPool{nullptr}, NumEventsAvailableInEventPool{}, NumEventsLiveInEventPool{} {} - // L0 does not have notion of contexts. + // Level Zero does not have notion of contexts. // Keep the device here (must be exactly one) to return it when PI context // is queried for devices. pi_device Device; @@ -164,7 +164,7 @@ struct _pi_queue : _pi_object { _pi_queue(ze_command_queue_handle_t Queue, pi_context Context) : ZeCommandQueue{Queue}, Context{Context} {} - // L0 command queue handle. + // Level Zero command queue handle. ze_command_queue_handle_t ZeCommandQueue; // Keeps the PI context to which this queue belongs. @@ -197,10 +197,10 @@ struct _pi_mem : _pi_object { // Interface of the _pi_mem object - // Get the L0 handle of the current memory object + // Get the Level Zero handle of the current memory object virtual void *getZeHandle() = 0; - // Get a pointer to the L0 handle of the current memory object + // Get a pointer to the Level Zero handle of the current memory object virtual void *getZeHandlePtr() = 0; // Method to get type of the derived object (image or buffer) @@ -241,7 +241,7 @@ struct _pi_buffer final : _pi_mem { bool isSubBuffer() const { return SubBuffer.Parent != nullptr; } - // L0 memory handle is really just a naked pointer. + // Level Zero memory handle is really just a naked pointer. // It is just convenient to have it char * to simplify offset arithmetics. char *ZeMem; @@ -268,7 +268,7 @@ struct _pi_image final : _pi_mem { ze_image_desc_t ZeImageDesc; #endif // !NDEBUG - // L0 image handle. + // Level Zero image handle. ze_image_handle_t ZeImage; }; @@ -278,12 +278,12 @@ struct _pi_event : _pi_object { : ZeEvent{ZeEvent}, ZeEventPool{ZeEventPool}, ZeCommandList{nullptr}, CommandType{CommandType}, Context{Context}, CommandData{nullptr} {} - // L0 event handle. + // Level Zero event handle. ze_event_handle_t ZeEvent; - // L0 event pool handle. + // Level Zero event pool handle. ze_event_pool_handle_t ZeEventPool; - // L0 command list where the command signaling this event was appended to. + // Level Zero command list where the command signaling this event was appended to. // This is currently used to remember/destroy the command list after // all commands in it are completed, i.e. this event signaled. ze_command_list_handle_t ZeCommandList; @@ -300,7 +300,7 @@ struct _pi_event : _pi_object { // Opaque data to hold any data needed for CommandType. void *CommandData; - // Methods for translating PI events list into L0 events list + // Methods for translating PI events list into Level Zero events list static ze_event_handle_t *createZeEventList(pi_uint32, const pi_event *); static void deleteZeEventList(ze_event_handle_t *); }; @@ -309,7 +309,7 @@ struct _pi_program : _pi_object { _pi_program(ze_module_handle_t Module, pi_context Context) : ZeModule{Module}, Context{Context} {} - // L0 module handle. + // Level Zero module handle. ze_module_handle_t ZeModule; // Keep the context of the program. @@ -320,7 +320,7 @@ struct _pi_kernel : _pi_object { _pi_kernel(ze_kernel_handle_t Kernel, pi_program Program) : ZeKernel{Kernel}, Program{Program} {} - // L0 function handle. + // Level Zero function handle. ze_kernel_handle_t ZeKernel; // Keep the program of the kernel. @@ -330,11 +330,11 @@ struct _pi_kernel : _pi_object { struct _pi_sampler : _pi_object { _pi_sampler(ze_sampler_handle_t Sampler) : ZeSampler{Sampler} {} - // L0 sampler handle. - // TODO: It is important that L0 handler is the first data member. Workaround + // Level Zero sampler handle. + // TODO: It is important that Level Zero handler is the first data member. Workaround // in SYCL RT (in ExecCGCommand::enqueueImp()) relies on this. This comment // should be removed when workaround in SYCL runtime will be removed. ze_sampler_handle_t ZeSampler; }; -#endif // PI_LEVEL0_HPP +#endif // PI_LEVEL_ZERO_HPP diff --git a/sycl/source/detail/config.hpp b/sycl/source/detail/config.hpp index f19816e8995e4..09c670152895c 100644 --- a/sycl/source/detail/config.hpp +++ b/sycl/source/detail/config.hpp @@ -15,6 +15,7 @@ #include #include #include +#include #include __SYCL_INLINE_NAMESPACE(cl) { @@ -111,6 +112,7 @@ template <> class SYCLConfig { static backend *get() { static bool Initialized = false; static backend *BackendPtr = nullptr; + const char *newStr = "PI_LEVEL_ZERO"; // Configuration parameters are processed only once, like reading a string // from environment and converting it into a typed object. @@ -120,9 +122,12 @@ template <> class SYCLConfig { const char *ValStr = BaseT::getRawValue(); const std::array, 3> SyclBeMap = { {{"PI_OPENCL", backend::opencl}, - {"PI_LEVEL0", backend::level_zero}, + {"PI_LEVEL_ZERO", backend::level_zero}, {"PI_CUDA", backend::cuda}}}; if (ValStr) { + if (strcmp(ValStr, "PI_LEVEL0") == 0) { + ValStr = newStr; + } auto It = std::find_if( std::begin(SyclBeMap), std::end(SyclBeMap), [&ValStr](const std::pair &element) { @@ -130,7 +135,7 @@ template <> class SYCLConfig { }); if (It == SyclBeMap.end()) pi::die("Invalid backend. " - "Valid values are PI_OPENCL/PI_LEVEL0/PI_CUDA"); + "Valid values are PI_OPENCL/PI_LEVEL_ZERO/PI_CUDA"); static backend Backend = It->second; BackendPtr = &Backend; } diff --git a/sycl/source/detail/pi.cpp b/sycl/source/detail/pi.cpp index 786f61416d2e0..71580d24f4bcf 100644 --- a/sycl/source/detail/pi.cpp +++ b/sycl/source/detail/pi.cpp @@ -215,7 +215,7 @@ bool findPlugins(vector_class> &PluginNames) { // env only. // PluginNames.emplace_back(OPENCL_PLUGIN_NAME, backend::opencl); - PluginNames.emplace_back(LEVEL0_PLUGIN_NAME, backend::level_zero); + PluginNames.emplace_back(LEVEL_ZERO_PLUGIN_NAME, backend::level_zero); PluginNames.emplace_back(CUDA_PLUGIN_NAME, backend::cuda); return true; } diff --git a/sycl/source/detail/program_manager/program_manager.cpp b/sycl/source/detail/program_manager/program_manager.cpp index 77a7153ce0af2..9f9a77b7a7b59 100644 --- a/sycl/source/detail/program_manager/program_manager.cpp +++ b/sycl/source/detail/program_manager/program_manager.cpp @@ -762,10 +762,10 @@ ProgramManager::build(ProgramPtr Program, const ContextImplPtr Context, LinkOpts = LinkOptions.c_str(); } - // L0 plugin doesn't support piProgramCompile/piProgramLink commands, program + // Level-Zero plugin doesn't support piProgramCompile/piProgramLink commands, program // is built during piProgramCreate. // TODO: remove this check as soon as piProgramCompile/piProgramLink will be - // implemented in L0 plugin. + // implemented in Level-Zero plugin. if (Context->getPlugin().getBackend() == backend::level_zero) { LinkDeviceLibs = false; } diff --git a/sycl/test/CMakeLists.txt b/sycl/test/CMakeLists.txt index 00df5fd456ad3..2977e07d6c22d 100644 --- a/sycl/test/CMakeLists.txt +++ b/sycl/test/CMakeLists.txt @@ -77,15 +77,15 @@ add_lit_target(check-sycl-inline-asm DEPENDS ${SYCL_TEST_DEPS} ) -add_lit_testsuite(check-level0 "Running the SYCL regression tests for Level Zero" +add_lit_testsuite(check-level-zero "Running the SYCL regression tests for Level Zero" ${CMAKE_CURRENT_BINARY_DIR} ARGS ${RT_TEST_ARGS} - PARAMS "SYCL_BE=PI_LEVEL0" + PARAMS "SYCL_BE=PI_LEVEL_ZERO" DEPENDS ${SYCL_TEST_DEPS} EXCLUDE_FROM_CHECK_ALL ) -add_dependencies(check-sycl check-level0) +add_dependencies(check-sycl check-level-zero) if(SYCL_BUILD_PI_CUDA) add_lit_testsuite(check-sycl-cuda "Running the SYCL regression tests for CUDA" diff --git a/sycl/test/abi/pi_level0_symbol_check.dump b/sycl/test/abi/pi_level_zero_symbol_check.dump similarity index 98% rename from sycl/test/abi/pi_level0_symbol_check.dump rename to sycl/test/abi/pi_level_zero_symbol_check.dump index 68b2d0c0e0c6b..fd50893724b3a 100644 --- a/sycl/test/abi/pi_level0_symbol_check.dump +++ b/sycl/test/abi/pi_level_zero_symbol_check.dump @@ -1,4 +1,4 @@ -# RUN: env LLVM_BIN_PATH=%llvm_build_bin_dir python %sycl_tools_src_dir/abi_check.py --mode check_symbols --reference %s %sycl_libs_dir/libpi_level0.so +# RUN: env LLVM_BIN_PATH=%llvm_build_bin_dir python %sycl_tools_src_dir/abi_check.py --mode check_symbols --reference %s %sycl_libs_dir/libpi_level_zero.so # REQUIRES: linux piDeviceGetInfo @@ -101,4 +101,3 @@ piEnqueueMemBufferWriteRect piextUSMHostAlloc piextPlatformGetNativeHandle piextPlatformCreateWithNativeHandle - diff --git a/sycl/test/basic_tests/buffer/reinterpret.cpp b/sycl/test/basic_tests/buffer/reinterpret.cpp index 7fd000f165131..7288d9bfb2c97 100644 --- a/sycl/test/basic_tests/buffer/reinterpret.cpp +++ b/sycl/test/basic_tests/buffer/reinterpret.cpp @@ -3,7 +3,7 @@ // RUN: %GPU_RUN_PLACEHOLDER %t.out // RUN: %ACC_RUN_PLACEHOLDER %t.out // -// XFAIL: level0 +// XFAIL: level_zero //==---------- reinterpret.cpp --- SYCL buffer reinterpret basic test ------==// // diff --git a/sycl/test/basic_tests/image_accessor_readsampler.cpp b/sycl/test/basic_tests/image_accessor_readsampler.cpp index fd93c37357aa1..8077e43c36853 100644 --- a/sycl/test/basic_tests/image_accessor_readsampler.cpp +++ b/sycl/test/basic_tests/image_accessor_readsampler.cpp @@ -6,7 +6,7 @@ // RUN: %CPU_RUN_PLACEHOLDER %t.out // RUN: %GPU_RUN_PLACEHOLDER %t.out // -// XFAIL: level0 +// XFAIL: level_zero //==------------------- image_accessor_readsampler.cpp ---------------------==// //==-----------------image_accessor read API test with sampler--------------==// // diff --git a/sycl/test/basic_tests/image_accessor_readwrite.cpp b/sycl/test/basic_tests/image_accessor_readwrite.cpp index 13c0b175bd1fc..0451ced85dc55 100644 --- a/sycl/test/basic_tests/image_accessor_readwrite.cpp +++ b/sycl/test/basic_tests/image_accessor_readwrite.cpp @@ -6,7 +6,7 @@ // RUN: %CPU_RUN_PLACEHOLDER %t.out // RUN: %GPU_RUN_PLACEHOLDER %t.out // -// XFAIL: windows && level0 +// XFAIL: windows && level_zero //==--------------------image_accessor_readwrite.cpp ----------------------==// //==----------image_accessor read without sampler & write API test---------==// diff --git a/sycl/test/basic_tests/image_accessor_readwrite_half.cpp b/sycl/test/basic_tests/image_accessor_readwrite_half.cpp index 6d5c1960655e5..931780c6c36a6 100644 --- a/sycl/test/basic_tests/image_accessor_readwrite_half.cpp +++ b/sycl/test/basic_tests/image_accessor_readwrite_half.cpp @@ -6,7 +6,7 @@ // RUN: %CPU_RUN_PLACEHOLDER %t.out // RUN: %GPU_RUN_PLACEHOLDER %t.out // -// XFAIL: windows && level0 +// XFAIL: windows && level_zero //==--------------------image_accessor_readwrite_half.cpp -------------------==// //==-image_accessor read (without sampler)& write API test for half datatype-==// diff --git a/sycl/test/basic_tests/kernel_info.cpp b/sycl/test/basic_tests/kernel_info.cpp index 193d89a4c4bd8..68a642b476e27 100644 --- a/sycl/test/basic_tests/kernel_info.cpp +++ b/sycl/test/basic_tests/kernel_info.cpp @@ -3,8 +3,8 @@ // RUN: %GPU_RUN_PLACEHOLDER %t.out // RUN: %ACC_RUN_PLACEHOLDER %t.out // -// Fail is flaky for level0, enable when fixed. -// UNSUPPORTED: level0 +// Fail is flaky for level_zero, enable when fixed. +// UNSUPPORTED: level_zero //==--- kernel_info.cpp - SYCL kernel info test ----------------------------==// // diff --git a/sycl/test/basic_tests/parallel_for_indexers.cpp b/sycl/test/basic_tests/parallel_for_indexers.cpp index ade6238b8c6c0..4c512d5da48d9 100644 --- a/sycl/test/basic_tests/parallel_for_indexers.cpp +++ b/sycl/test/basic_tests/parallel_for_indexers.cpp @@ -8,7 +8,7 @@ // TODO: Unexpected result // TODO: _indexers.cpp:37: int main(): Assertion `id == -1' failed. -// XFAIL: cuda || level0 +// XFAIL: cuda || level_zero #include diff --git a/sycl/test/basic_tests/parallel_for_range.cpp b/sycl/test/basic_tests/parallel_for_range.cpp index d5ed05868d1c3..f84fa90ef418a 100644 --- a/sycl/test/basic_tests/parallel_for_range.cpp +++ b/sycl/test/basic_tests/parallel_for_range.cpp @@ -1,4 +1,4 @@ -// XFAIL: cuda || level0 +// XFAIL: cuda || level_zero // CUDA exposes broken hierarchical parallelism. // RUN: %clangxx -fsycl -fsycl-targets=%sycl_triple %s -o %t.out diff --git a/sycl/test/host-interop-task/host-task-dependency.cpp b/sycl/test/host-interop-task/host-task-dependency.cpp index 60a1e60883d71..2bbc059a43e44 100644 --- a/sycl/test/host-interop-task/host-task-dependency.cpp +++ b/sycl/test/host-interop-task/host-task-dependency.cpp @@ -4,7 +4,7 @@ // RUN: %ACC_RUN_PLACEHOLDER SYCL_PI_TRACE=-1 %t.out 2>&1 %ACC_CHECK_PLACEHOLDER // // TODO: Behaviour is unstable for level zero on Windows. Enable when fixed. -// UNSUPPORTED: windows && level0 +// UNSUPPORTED: windows && level_zero #include #include diff --git a/sycl/test/host-interop-task/host-task-two-queues.cpp b/sycl/test/host-interop-task/host-task-two-queues.cpp index 5157b83b60092..7644d6bcfcd53 100644 --- a/sycl/test/host-interop-task/host-task-two-queues.cpp +++ b/sycl/test/host-interop-task/host-task-two-queues.cpp @@ -4,7 +4,7 @@ // RUN: %ACC_RUN_PLACEHOLDER %t.out // // TODO: Flaky fail on Level Zero that is why mark as unsupported temporarily. -// UNSUPPORTED: level0 +// UNSUPPORTED: level_zero #include #include diff --git a/sycl/test/host-interop-task/interop-task.cpp b/sycl/test/host-interop-task/interop-task.cpp index 6db65398e06bb..e22cdb2fedfab 100644 --- a/sycl/test/host-interop-task/interop-task.cpp +++ b/sycl/test/host-interop-task/interop-task.cpp @@ -2,7 +2,7 @@ // RUN: %CPU_RUN_PLACEHOLDER %t.out // RUN: %GPU_RUN_PLACEHOLDER %t.out // RUN: %ACC_RUN_PLACEHOLDER %t.out -// USUPPORTED: level0, cuda +// USUPPORTED: level_zero, cuda // REQUIRES: opencl #include diff --git a/sycl/test/lit.cfg.py b/sycl/test/lit.cfg.py index 545ebb995f60d..f2a58749a2a93 100644 --- a/sycl/test/lit.cfg.py +++ b/sycl/test/lit.cfg.py @@ -81,7 +81,7 @@ def getDeviceCount(device_type): is_cuda = False; - is_level0 = False; + is_level_zero = False; process = subprocess.Popen([get_device_count_by_type_path, device_type, backend], stdout=subprocess.PIPE) (output, err) = process.communicate() @@ -106,12 +106,12 @@ def getDeviceCount(device_type): if re.match(r".*cuda", result[1]): is_cuda = True; if re.match(r".*level zero", result[1]): - is_level0 = True; + is_level_zero = True; if err: lit_config.warning("getDeviceCount {TYPE} {BACKEND} stderr:{ERR}".format( TYPE=device_type, BACKEND=backend, ERR=err)) - return [value,is_cuda,is_level0] + return [value,is_cuda,is_level_zero] # Every SYCL implementation provides a host implementation. config.available_features.add('host') @@ -149,8 +149,8 @@ def getDeviceCount(device_type): gpu_check_on_linux_substitute = "" cuda = False -level0 = False -[gpu_count, cuda, level0] = getDeviceCount("gpu") +level_zero = False +[gpu_count, cuda, level_zero] = getDeviceCount("gpu") if gpu_count > 0: found_at_least_one_device = True @@ -160,8 +160,8 @@ def getDeviceCount(device_type): config.available_features.add('gpu') if cuda: config.available_features.add('cuda') - elif level0: - config.available_features.add('level0') + elif level_zero: + config.available_features.add('level_zero') if platform.system() == "Linux": gpu_run_on_linux_substitute = "env SYCL_DEVICE_TYPE=GPU SYCL_BE={SYCL_BE} ".format(SYCL_BE=backend) @@ -188,7 +188,7 @@ def getDeviceCount(device_type): config.substitutions.append( ('%ACC_CHECK_PLACEHOLDER', acc_check_substitute) ) # LIT testing either supports OpenCL or CUDA or Level Zero. -if not cuda and not level0 and found_at_least_one_device: +if not cuda and not level_zero and found_at_least_one_device: config.available_features.add('opencl') if cuda: diff --git a/sycl/test/regression/fsycl-save-temps.cpp b/sycl/test/regression/fsycl-save-temps.cpp index ce9e653af2608..7f89fa54feeca 100644 --- a/sycl/test/regression/fsycl-save-temps.cpp +++ b/sycl/test/regression/fsycl-save-temps.cpp @@ -22,6 +22,6 @@ int main() { } // TODO: Address a Windows-specific issue with integration header filenames -// XFAIL: system-windows && !level0 +// XFAIL: system-windows && !level_zero // TODO: fail is flaky on Windows for Level Zero. Enable when fixed. -// UNSUPPORTED: system-windows && level0 +// UNSUPPORTED: system-windows && level_zero diff --git a/sycl/test/regression/image_access.cpp b/sycl/test/regression/image_access.cpp index f32d0a33f6b91..e779fb5b4111b 100644 --- a/sycl/test/regression/image_access.cpp +++ b/sycl/test/regression/image_access.cpp @@ -5,9 +5,9 @@ // TODO: For now PI checks are skipped for ACC device. To decide if it's good. // RUN: env %ACC_RUN_PLACEHOLDER %t.out // -// UNSUPPORTED: cuda || windows && level0 +// UNSUPPORTED: cuda || windows && level_zero // CUDA cannot support OpenCL spec conform images. -// TODO: test hangs on level0, enable when fixed. +// TODO: test hangs on level_zero, enable when fixed. //==-------------- image_access.cpp - SYCL image accessors test -----------==// // diff --git a/sycl/test/regression/static-buffer-dtor.cpp b/sycl/test/regression/static-buffer-dtor.cpp index 5899420c20454..c541c180e7d73 100644 --- a/sycl/test/regression/static-buffer-dtor.cpp +++ b/sycl/test/regression/static-buffer-dtor.cpp @@ -14,7 +14,7 @@ // RUN: %GPU_RUN_PLACEHOLDER %t.out // RUN: %ACC_RUN_PLACEHOLDER %t.out // -// XFAIL: linux && level0 +// XFAIL: linux && level_zero #include diff --git a/sycl/test/spec_const/spec_const_hw.cpp b/sycl/test/spec_const/spec_const_hw.cpp index 6e051910ce680..b9eb539af8b35 100644 --- a/sycl/test/spec_const/spec_const_hw.cpp +++ b/sycl/test/spec_const/spec_const_hw.cpp @@ -6,7 +6,7 @@ // TODO: re-enable after CI drivers are updated to newer which support spec // constants: // XFAIL: linux && opencl -// UNSUPPORTED: cuda || level0 +// UNSUPPORTED: cuda || level_zero // //==----------- spec_const_hw.cpp ------------------------------------------==// // diff --git a/sycl/test/spec_const/spec_const_neg.cpp b/sycl/test/spec_const/spec_const_neg.cpp index 18fb8ed5d9d0c..7312e29ab40e1 100644 --- a/sycl/test/spec_const/spec_const_neg.cpp +++ b/sycl/test/spec_const/spec_const_neg.cpp @@ -3,7 +3,7 @@ // RUN: %CPU_RUN_PLACEHOLDER %t.out // RUN: %GPU_RUN_PLACEHOLDER %t.out // Specialization constants are not supported on FPGA h/w and emulator. -// UNSUPPORTED: cuda || level0 +// UNSUPPORTED: cuda || level_zero // //==----------- spec_const_hw.cpp ------------------------------------------==// // diff --git a/sycl/test/spec_const/spec_const_redefine.cpp b/sycl/test/spec_const/spec_const_redefine.cpp index ac65587905bf0..da80365865c42 100644 --- a/sycl/test/spec_const/spec_const_redefine.cpp +++ b/sycl/test/spec_const/spec_const_redefine.cpp @@ -6,7 +6,7 @@ // TODO: re-enable after CI drivers are updated to newer which support spec // constants: // XFAIL: linux && opencl -// UNSUPPORTED: cuda || level0 +// UNSUPPORTED: cuda || level_zero // //==----------- spec_const_redefine.cpp ------------------------------------==// // diff --git a/sycl/test/usm/allocator_vector.cpp b/sycl/test/usm/allocator_vector.cpp index 265c071e1cf0e..16b086a4bac3c 100644 --- a/sycl/test/usm/allocator_vector.cpp +++ b/sycl/test/usm/allocator_vector.cpp @@ -1,4 +1,4 @@ -// XFAIL: cuda || level0 +// XFAIL: cuda || level_zero // piextUSM*Alloc functions for CUDA are not behaving as described in // https://github.com/intel/llvm/blob/sycl/sycl/doc/extensions/USM/USM.adoc // https://github.com/intel/llvm/blob/sycl/sycl/doc/extensions/USM/cl_intel_unified_shared_memory.asciidoc diff --git a/sycl/tools/get_device_count_by_type.cpp b/sycl/tools/get_device_count_by_type.cpp index 26a9a0a4ed6ad..abf70ce98c357 100644 --- a/sycl/tools/get_device_count_by_type.cpp +++ b/sycl/tools/get_device_count_by_type.cpp @@ -32,7 +32,7 @@ static const std::string help = " Help\n" " Example: ./get_device_count_by_type cpu opencl\n" " Supported device types: cpu/gpu/accelerator/default/all\n" - " Supported backends: PI_CUDA/PI_OPENCL/PI_LEVEL0 \n" + " Supported backends: PI_CUDA/PI_OPENCL/PI_LEVEL_ZERO \n" " Output format: :"; // Return the string with all characters translated to lower case. @@ -259,7 +259,7 @@ int main(int argc, char *argv[]) { if (backend == "opencl" || backend == "pi_opencl") { querySuccess = queryOpenCL(deviceType, deviceCount, msg); - } else if (backend == "level0" || backend == "pi_level0") { + } else if (backend == "level_zero" || backend == "pi_level_zero") { querySuccess = queryLevelZero(deviceType, deviceCount, msg); } else if (backend == "cuda" || backend == "pi_cuda") { querySuccess = queryCUDA(deviceType, deviceCount, msg); From 91f729a5b4e59ec35ba0f26ecac77f1b1cb13150 Mon Sep 17 00:00:00 2001 From: Gail Lyons Date: Tue, 14 Jul 2020 05:43:50 -0700 Subject: [PATCH 3/9] Resolving merge updates Signed-off-by: Gail Lyons --- sycl/include/CL/sycl/backend/level_zero.hpp | 22 ++++++++++----------- sycl/source/backend/level_zero.cpp | 18 ++++++++--------- sycl/source/detail/pi.cpp | 10 +++++----- sycl/source/device_selector.cpp | 4 ++-- sycl/test/abi/sycl_symbols_linux.dump | 15 +++++++------- sycl/test/plugins/sycl-ls-gpu-default.cpp | 2 +- 6 files changed, 35 insertions(+), 36 deletions(-) diff --git a/sycl/include/CL/sycl/backend/level_zero.hpp b/sycl/include/CL/sycl/backend/level_zero.hpp index 54a1a04d5f996..2187525bffa33 100644 --- a/sycl/include/CL/sycl/backend/level_zero.hpp +++ b/sycl/include/CL/sycl/backend/level_zero.hpp @@ -14,30 +14,30 @@ __SYCL_INLINE_NAMESPACE(cl) { namespace sycl { -template <> struct interop { +template <> struct interop { using type = ze_driver_handle_t; }; -template <> struct interop { +template <> struct interop { using type = ze_device_handle_t; }; -template <> struct interop { +template <> struct interop { using type = ze_command_queue_handle_t; }; -template <> struct interop { +template <> struct interop { using type = ze_module_handle_t; }; template -struct interop> { using type = char *; }; -namespace level0 { +namespace level_zero { // Implementation of various "make" functions resides in libsycl.so platform make_platform(pi_native_handle NativeHandle); @@ -48,7 +48,7 @@ queue make_queue(const context &Context, pi_native_handle InteropHandle); // Construction of SYCL platform. template ::value>::type * = nullptr> -T make(typename interop::type Interop) { +T make(typename interop::type Interop) { return make_platform(reinterpret_cast(Interop)); } @@ -56,7 +56,7 @@ T make(typename interop::type Interop) { template ::value>::type * = nullptr> T make(const platform &Platform, - typename interop::type Interop) { + typename interop::type Interop) { return make_device(Platform, reinterpret_cast(Interop)); } @@ -64,7 +64,7 @@ T make(const platform &Platform, template ::value>::type * = nullptr> T make(const context &Context, - typename interop::type Interop) { + typename interop::type Interop) { return make_program(Context, reinterpret_cast(Interop)); } @@ -72,10 +72,10 @@ T make(const context &Context, template ::value>::type * = nullptr> T make(const context &Context, - typename interop::type Interop) { + typename interop::type Interop) { return make_queue(Context, reinterpret_cast(Interop)); } -} // namespace level0 +} // namespace level_zero } // namespace sycl } // __SYCL_INLINE_NAMESPACE(cl) diff --git a/sycl/source/backend/level_zero.cpp b/sycl/source/backend/level_zero.cpp index 2e62223c0301e..6d7c7a347e89d 100644 --- a/sycl/source/backend/level_zero.cpp +++ b/sycl/source/backend/level_zero.cpp @@ -14,13 +14,13 @@ __SYCL_INLINE_NAMESPACE(cl) { namespace sycl { -namespace level0 { +namespace level_zero { using namespace detail; //---------------------------------------------------------------------------- -// Implementation of level0::make +// Implementation of level_zero::make __SYCL_EXPORT platform make_platform(pi_native_handle NativeHandle) { - const auto &Plugin = pi::getPlugin(); + const auto &Plugin = pi::getPlugin(); // Create PI platform first. pi::PiPlatform PiPlatform; Plugin.call(NativeHandle, @@ -32,10 +32,10 @@ __SYCL_EXPORT platform make_platform(pi_native_handle NativeHandle) { } //---------------------------------------------------------------------------- -// Implementation of level0::make +// Implementation of level_zero::make __SYCL_EXPORT device make_device(const platform &Platform, pi_native_handle NativeHandle) { - const auto &Plugin = pi::getPlugin(); + const auto &Plugin = pi::getPlugin(); const auto &PlatformImpl = getSyclObjImpl(Platform); // Create PI device first. pi::PiDevice PiDevice; @@ -47,7 +47,7 @@ __SYCL_EXPORT device make_device(const platform &Platform, } //---------------------------------------------------------------------------- -// Implementation of level0::make +// Implementation of level_zero::make __SYCL_EXPORT program make_program(const context &Context, pi_native_handle NativeHandle) { // Construct the SYCL program from native program. @@ -58,10 +58,10 @@ __SYCL_EXPORT program make_program(const context &Context, } //---------------------------------------------------------------------------- -// Implementation of level0::make +// Implementation of level_zero::make __SYCL_EXPORT queue make_queue(const context &Context, pi_native_handle NativeHandle) { - const auto &Plugin = pi::getPlugin(); + const auto &Plugin = pi::getPlugin(); const auto &ContextImpl = getSyclObjImpl(Context); // Create PI queue first. pi::PiQueue PiQueue; @@ -72,6 +72,6 @@ __SYCL_EXPORT queue make_queue(const context &Context, PiQueue, ContextImpl, ContextImpl->get_async_handler())); } -} // namespace level0 +} // namespace level_zero } // namespace sycl } // __SYCL_INLINE_NAMESPACE(cl) diff --git a/sycl/source/detail/pi.cpp b/sycl/source/detail/pi.cpp index 54c0251d164fc..eecd3e965ae28 100644 --- a/sycl/source/detail/pi.cpp +++ b/sycl/source/detail/pi.cpp @@ -319,11 +319,11 @@ static void initializePlugins(vector_class *Plugins) { PluginNames[I].first.find("cuda") != std::string::npos) { // Use the CUDA plugin as the GlobalPlugin GlobalPlugin = std::make_shared(PluginInformation, backend::cuda); - } else if (InteropBE == backend::level0 && - PluginNames[I].first.find("level0") != std::string::npos) { - // Use the LEVEL0 plugin as the GlobalPlugin + } else if (InteropBE == backend::level_zero && + PluginNames[I].first.find("level_zero") != std::string::npos) { + // Use the LEVEL_ZERO plugin as the GlobalPlugin GlobalPlugin = - std::make_shared(PluginInformation, backend::level0); + std::make_shared(PluginInformation, backend::level_zero); } Plugins->emplace_back(plugin(PluginInformation, PluginNames[I].second)); if (trace(TraceLevel::PI_TRACE_BASIC)) @@ -395,7 +395,7 @@ template const plugin &getPlugin() { } template const plugin &getPlugin(); -template const plugin &getPlugin(); +template const plugin &getPlugin(); // Report error and no return (keeps compiler from printing warnings). // TODO: Probably change that to throw a catchable exception, diff --git a/sycl/source/device_selector.cpp b/sycl/source/device_selector.cpp index ce6011439f4bf..b609b947d1410 100644 --- a/sycl/source/device_selector.cpp +++ b/sycl/source/device_selector.cpp @@ -19,13 +19,13 @@ __SYCL_INLINE_NAMESPACE(cl) { namespace sycl { // Utility function to check if device is of the preferred backend. -// Currently preference is given to the level0 backend. +// Currently preference is given to the level_zero backend. static bool isDeviceOfPreferredSyclBe(const device &Device) { if (Device.is_host()) return false; return detail::getSyclObjImpl(Device)->getPlugin().getBackend() == - backend::level0; + backend::level_zero; } device device_selector::select_device() const { diff --git a/sycl/test/abi/sycl_symbols_linux.dump b/sycl/test/abi/sycl_symbols_linux.dump index 1425b82d13d52..a9c92619a68bb 100644 --- a/sycl/test/abi/sycl_symbols_linux.dump +++ b/sycl/test/abi/sycl_symbols_linux.dump @@ -3584,6 +3584,10 @@ _ZN2cl10__host_std9u_sub_satEhh _ZN2cl10__host_std9u_sub_satEjj _ZN2cl10__host_std9u_sub_satEmm _ZN2cl10__host_std9u_sub_satEtt +_ZN2cl4sycl10level_zero10make_queueERKNS0_7contextEm +_ZN2cl4sycl10level_zero11make_deviceERKNS0_8platformEm +_ZN2cl4sycl10level_zero12make_programERKNS0_7contextEm +_ZN2cl4sycl10level_zero13make_platformEm _ZN2cl4sycl11malloc_hostEmRKNS0_5queueE _ZN2cl4sycl11malloc_hostEmRKNS0_7contextE _ZN2cl4sycl13aligned_allocEmmRKNS0_5queueENS0_3usm5allocE @@ -3724,7 +3728,9 @@ _ZN2cl4sycl6detail13MemoryManager13releaseMemObjESt10shared_ptrINS1_12context_im _ZN2cl4sycl6detail13MemoryManager16allocateMemImageESt10shared_ptrINS1_12context_implEEPNS1_11SYCLMemObjIEPvbmRK14_pi_image_descRK16_pi_image_formatRKS3_INS1_10event_implEERKS5_RP9_pi_event _ZN2cl4sycl6detail13MemoryManager17allocateMemBufferESt10shared_ptrINS1_12context_implEEPNS1_11SYCLMemObjIEPvbmRKS3_INS1_10event_implEERKS5_RP9_pi_event _ZN2cl4sycl6detail13MemoryManager18allocateHostMemoryEPNS1_11SYCLMemObjIEPvbm +_ZN2cl4sycl6detail13MemoryManager18releaseImageBufferESt10shared_ptrINS1_12context_implEEPv _ZN2cl4sycl6detail13MemoryManager19allocateImageObjectESt10shared_ptrINS1_12context_implEEPvbRK14_pi_image_descRK16_pi_image_format +_ZN2cl4sycl6detail13MemoryManager19wrapIntoImageBufferESt10shared_ptrINS1_12context_implEEPvPNS1_11SYCLMemObjIE _ZN2cl4sycl6detail13MemoryManager20allocateBufferObjectESt10shared_ptrINS1_12context_implEEPvbm _ZN2cl4sycl6detail13MemoryManager20allocateMemSubBufferESt10shared_ptrINS1_12context_implEEPvmmNS0_5rangeILi3EEESt6vectorIS3_INS1_10event_implEESaISB_EERP9_pi_event _ZN2cl4sycl6detail13MemoryManager24allocateInteropMemObjectESt10shared_ptrINS1_12context_implEEPvRKS3_INS1_10event_implEERKS5_RP9_pi_event @@ -3736,8 +3742,6 @@ _ZN2cl4sycl6detail13MemoryManager7releaseESt10shared_ptrINS1_12context_implEEPNS _ZN2cl4sycl6detail13MemoryManager8allocateESt10shared_ptrINS1_12context_implEEPNS1_11SYCLMemObjIEbPvSt6vectorIS3_INS1_10event_implEESaISB_EERP9_pi_event _ZN2cl4sycl6detail13MemoryManager8copy_usmEPKvSt10shared_ptrINS1_10queue_implEEmPvSt6vectorIP9_pi_eventSaISB_EERSB_ _ZN2cl4sycl6detail13MemoryManager8fill_usmEPvSt10shared_ptrINS1_10queue_implEEmiSt6vectorIP9_pi_eventSaIS9_EERS9_ -_ZN2cl4sycl6detail13MemoryManager18releaseImageBufferESt10shared_ptrINS1_12context_implEEPv -_ZN2cl4sycl6detail13MemoryManager19wrapIntoImageBufferESt10shared_ptrINS1_12context_implEEPvPNS1_11SYCLMemObjIE _ZN2cl4sycl6detail14getBorderColorENS0_19image_channel_orderE _ZN2cl4sycl6detail14host_half_impl4halfC1ERKf _ZN2cl4sycl6detail14host_half_impl4halfC2ERKf @@ -4044,6 +4048,7 @@ _ZNK2cl4sycl7program7is_hostEv _ZNK2cl4sycl7program8get_infoILNS0_4info7programE4448EEENS3_12param_traitsIS4_XT_EE11return_typeEv _ZNK2cl4sycl7program8get_infoILNS0_4info7programE4449EEENS3_12param_traitsIS4_XT_EE11return_typeEv _ZNK2cl4sycl7program8get_infoILNS0_4info7programE4451EEENS3_12param_traitsIS4_XT_EE11return_typeEv +_ZNK2cl4sycl7program9getNativeEv _ZNK2cl4sycl7program9get_stateEv _ZNK2cl4sycl7sampler18get_filtering_modeEv _ZNK2cl4sycl7sampler19get_addressing_modeEv @@ -4067,9 +4072,3 @@ _ZNK2cl4sycl9exception11has_contextEv _ZNK2cl4sycl9exception4whatEv __sycl_register_lib __sycl_unregister_lib -_ZN2cl4sycl6level011make_deviceERKNS0_8platformEm -_ZN2cl4sycl6level010make_queueERKNS0_7contextEm -_ZN2cl4sycl6level012make_programERKNS0_7contextEm -_ZN2cl4sycl6level013make_platformEm -_ZNK2cl4sycl8platform9getNativeEv -_ZNK2cl4sycl7program9getNativeEv diff --git a/sycl/test/plugins/sycl-ls-gpu-default.cpp b/sycl/test/plugins/sycl-ls-gpu-default.cpp index a07933f2ccff8..a57fc2a39a027 100755 --- a/sycl/test/plugins/sycl-ls-gpu-default.cpp +++ b/sycl/test/plugins/sycl-ls-gpu-default.cpp @@ -1,4 +1,4 @@ -// REQUIRES: gpu, level0 +// REQUIRES: gpu, level_zero // RUN: sycl-ls --verbose >%t.default.out // RUN: FileCheck %s --check-prefixes=CHECK-GPU-BUILTIN,CHECK-GPU-CUSTOM --input-file %t.default.out From e96a951c080aca3e65092a57226dbf139cebbc22 Mon Sep 17 00:00:00 2001 From: Gail Lyons Date: Wed, 15 Jul 2020 08:12:37 -0700 Subject: [PATCH 4/9] Incorporating code review comments Signed-off-by: Gail Lyons --- sycl/plugins/level_zero/CMakeLists.txt | 52 +++++++++++++------------- sycl/source/detail/config.hpp | 7 +--- sycl/tools/CMakeLists.txt | 8 ++-- 3 files changed, 32 insertions(+), 35 deletions(-) diff --git a/sycl/plugins/level_zero/CMakeLists.txt b/sycl/plugins/level_zero/CMakeLists.txt index dd7b7efffb1f3..a3ac89c5bbf0f 100755 --- a/sycl/plugins/level_zero/CMakeLists.txt +++ b/sycl/plugins/level_zero/CMakeLists.txt @@ -1,14 +1,14 @@ # PI Level Zero plugin library if(MSVC) - set(L0_LOADER + set(LEVEL_ZERO_LOADER "${LLVM_LIBRARY_OUTPUT_INTDIR}/${CMAKE_STATIC_LIBRARY_PREFIX}ze_loader${CMAKE_STATIC_LIBRARY_SUFFIX}") else() - set(L0_LOADER + set(LEVEL_ZERO_LOADER "${LLVM_LIBRARY_OUTPUT_INTDIR}/${CMAKE_SHARED_LIBRARY_PREFIX}ze_loader${CMAKE_SHARED_LIBRARY_SUFFIX}") endif() -if (NOT DEFINED L0_LIBRARY OR NOT DEFINED L0_INCLUDE_DIR) +if (NOT DEFINED LEVEL_ZERO_LIBRARY OR NOT DEFINED LEVEL_ZERO_INCLUDE_DIR) message(STATUS "Download Level Zero loader and headers from github.com") if (CMAKE_C_COMPILER) list(APPEND AUX_CMAKE_FLAGS -DCMAKE_C_COMPILER=${CMAKE_C_COMPILER}) @@ -16,18 +16,18 @@ if (NOT DEFINED L0_LIBRARY OR NOT DEFINED L0_INCLUDE_DIR) if (CMAKE_CXX_COMPILER) list(APPEND AUX_CMAKE_FLAGS -DCMAKE_CXX_COMPILER=${CMAKE_CXX_COMPILER}) endif() - file(MAKE_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/l0_loader_build) - set(L0_LOADER_SOURCE_DIR "${CMAKE_CURRENT_BINARY_DIR}/Level0/l0_loader") - if (NOT DEFINED SYCL_EP_L0_LOADER_SKIP_AUTO_UPDATE) - set(SYCL_EP_L0_LOADER_SKIP_AUTO_UPDATE ${SYCL_EXTERNAL_PROJECTS_SKIP_AUTO_UPDATE}) + file(MAKE_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/level_zero_loader_build) + set(LEVEL_ZERO_LOADER_SOURCE_DIR "${CMAKE_CURRENT_BINARY_DIR}/level_zero/level_zero_loader") + if (NOT DEFINED SYCL_EP_LEVEL_ZERO_LOADER_SKIP_AUTO_UPDATE) + set(SYCL_EP_LEVEL_ZERO_LOADER_SKIP_AUTO_UPDATE ${SYCL_EXTERNAL_PROJECTS_SKIP_AUTO_UPDATE}) endif() - ExternalProject_Add(l0-loader + ExternalProject_Add(level-zero-loader GIT_REPOSITORY https://github.com/oneapi-src/level-zero.git GIT_TAG origin/master - UPDATE_DISCONNECTED ${SYCL_EP_L0_LOADER_SKIP_AUTO_UPDATE} - SOURCE_DIR ${L0_LOADER_SOURCE_DIR} - BINARY_DIR "${CMAKE_CURRENT_BINARY_DIR}/l0_loader_build" - INSTALL_DIR "${CMAKE_CURRENT_BINARY_DIR}/l0_loader_install" + UPDATE_DISCONNECTED ${SYCL_EP_LEVEL_ZERO_LOADER_SKIP_AUTO_UPDATE} + SOURCE_DIR ${LEVEL_ZERO_LOADER_SOURCE_DIR} + BINARY_DIR "${CMAKE_CURRENT_BINARY_DIR}/level_zero_loader_build" + INSTALL_DIR "${CMAKE_CURRENT_BINARY_DIR}/level_zero_loader_install" CMAKE_ARGS -DCMAKE_BUILD_TYPE=${CMAKE_BUILD_TYPE} -DCMAKE_MAKE_PROGRAM=${CMAKE_MAKE_PROGRAM} -DOpenCL_INCLUDE_DIR=${OpenCL_INCLUDE_DIRS} @@ -36,31 +36,31 @@ if (NOT DEFINED L0_LIBRARY OR NOT DEFINED L0_INCLUDE_DIR) ${AUX_CMAKE_FLAGS} STEP_TARGETS configure,build,install DEPENDS ocl-headers - BUILD_BYPRODUCTS ${L0_LOADER} + BUILD_BYPRODUCTS ${LEVEL_ZERO_LOADER} ) - ExternalProject_Add_Step(l0-loader llvminstall + ExternalProject_Add_Step(level-zero-loader llvminstall COMMAND ${CMAKE_COMMAND} -E copy_directory / ${LLVM_BINARY_DIR} - COMMENT "Installing l0-loader into the LLVM binary directory" + COMMENT "Installing level-zero-loader into the LLVM binary directory" DEPENDEES install ) - install(DIRECTORY "${CMAKE_CURRENT_BINARY_DIR}/l0_loader_install/" + install(DIRECTORY "${CMAKE_CURRENT_BINARY_DIR}/level_zero_loader_install/" DESTINATION "." - COMPONENT l0-loader + COMPONENT level-zero-loader ) - list(APPEND SYCL_TOOLCHAIN_DEPLOY_COMPONENTS l0-loader) + list(APPEND SYCL_TOOLCHAIN_DEPLOY_COMPONENTS level-zero-loader) else() - include_directories("${L0_INCLUDE_DIR}") - file(GLOB L0_LIBRARY_SRC "${L0_LIBRARY}*") - file(COPY ${L0_LIBRARY_SRC} DESTINATION ${LLVM_LIBRARY_OUTPUT_INTDIR}) - add_custom_target(l0-loader DEPENDS ${L0_LIBRARY} COMMENT "Copying Level Zero Loader ...") + include_directories("${LEVEL_ZERO_INCLUDE_DIR}") + file(GLOB LEVEL_ZERO_LIBRARY_SRC "${LEVEL_ZERO_LIBRARY}*") + file(COPY ${LEVEL_ZERO_LIBRARY_SRC} DESTINATION ${LLVM_LIBRARY_OUTPUT_INTDIR}) + add_custom_target(level-zero-loader DEPENDS ${LEVEL_ZERO_LIBRARY} COMMENT "Copying Level Zero Loader ...") endif() add_library (L0Loader-Headers INTERFACE) add_library (L0Loader::Headers ALIAS L0Loader-Headers) target_include_directories(L0Loader-Headers - INTERFACE "${L0_INCLUDE_DIR}" + INTERFACE "${LEVEL_ZERO_INCLUDE_DIR}" ) include_directories("${sycl_inc_dir}") @@ -92,12 +92,12 @@ else() ) endif() -if (TARGET l0-loader) - add_dependencies(pi_level_zero l0-loader) +if (TARGET level-zero-loader) + add_dependencies(pi_level_zero level-zero-loader) endif() add_dependencies(sycl-toolchain pi_level_zero) - target_link_libraries(pi_level_zero PRIVATE "${L0_LOADER}") + target_link_libraries(pi_level_zero PRIVATE "${LEVEL_ZERO_LOADER}") if (UNIX) target_link_libraries(pi_level_zero PRIVATE pthread) endif() diff --git a/sycl/source/detail/config.hpp b/sycl/source/detail/config.hpp index 09c670152895c..948c91849fc68 100644 --- a/sycl/source/detail/config.hpp +++ b/sycl/source/detail/config.hpp @@ -112,7 +112,6 @@ template <> class SYCLConfig { static backend *get() { static bool Initialized = false; static backend *BackendPtr = nullptr; - const char *newStr = "PI_LEVEL_ZERO"; // Configuration parameters are processed only once, like reading a string // from environment and converting it into a typed object. @@ -120,14 +119,12 @@ template <> class SYCLConfig { return BackendPtr; const char *ValStr = BaseT::getRawValue(); - const std::array, 3> SyclBeMap = { + const std::array, 4> SyclBeMap = { {{"PI_OPENCL", backend::opencl}, {"PI_LEVEL_ZERO", backend::level_zero}, + {"PI_LEVEL0", backend::level_zero}, // for backward compatibility {"PI_CUDA", backend::cuda}}}; if (ValStr) { - if (strcmp(ValStr, "PI_LEVEL0") == 0) { - ValStr = newStr; - } auto It = std::find_if( std::begin(SyclBeMap), std::end(SyclBeMap), [&ValStr](const std::pair &element) { diff --git a/sycl/tools/CMakeLists.txt b/sycl/tools/CMakeLists.txt index 1e2843e0b9385..55a18938d3462 100644 --- a/sycl/tools/CMakeLists.txt +++ b/sycl/tools/CMakeLists.txt @@ -6,13 +6,13 @@ add_subdirectory(sycl-ls) # TODO: move each tool in its own sub-directory add_executable(get_device_count_by_type get_device_count_by_type.cpp) -add_dependencies(get_device_count_by_type ocl-headers ocl-icd l0-loader) +add_dependencies(get_device_count_by_type ocl-headers ocl-icd level-zero-loader) if(MSVC) - set(L0_LIBRARY + set(LEVEL_ZERO_LIBRARY "${LLVM_LIBRARY_OUTPUT_INTDIR}/${CMAKE_STATIC_LIBRARY_PREFIX}ze_loader${CMAKE_STATIC_LIBRARY_SUFFIX}") else() - set(L0_LIBRARY + set(LEVEL_ZERO_LIBRARY "${LLVM_LIBRARY_OUTPUT_INTDIR}/${CMAKE_SHARED_LIBRARY_PREFIX}ze_loader${CMAKE_SHARED_LIBRARY_SUFFIX}") endif() @@ -21,7 +21,7 @@ target_link_libraries(get_device_count_by_type OpenCL::Headers L0Loader::Headers ${OpenCL_LIBRARIES} - ${L0_LIBRARY} + ${LEVEL_ZERO_LIBRARY} $<$:cudadrv> ) target_compile_definitions(get_device_count_by_type From f5083b2a59e5a47bcb9965d3eeb3967e79710cda Mon Sep 17 00:00:00 2001 From: Gail Lyons Date: Thu, 16 Jul 2020 06:48:43 -0700 Subject: [PATCH 5/9] Incorporating code review comments Signed-off-by: Gail Lyons --- sycl/plugins/level_zero/CMakeLists.txt | 6 +++--- sycl/tools/CMakeLists.txt | 2 +- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/sycl/plugins/level_zero/CMakeLists.txt b/sycl/plugins/level_zero/CMakeLists.txt index a3ac89c5bbf0f..7595eee0a8453 100755 --- a/sycl/plugins/level_zero/CMakeLists.txt +++ b/sycl/plugins/level_zero/CMakeLists.txt @@ -57,9 +57,9 @@ else() add_custom_target(level-zero-loader DEPENDS ${LEVEL_ZERO_LIBRARY} COMMENT "Copying Level Zero Loader ...") endif() -add_library (L0Loader-Headers INTERFACE) -add_library (L0Loader::Headers ALIAS L0Loader-Headers) -target_include_directories(L0Loader-Headers +add_library (LevelZeroLoader-Headers INTERFACE) +add_library (LevelZeroLoader::Headers ALIAS LevelZeroLoader-Headers) +target_include_directories(LevelZeroLoader-Headers INTERFACE "${LEVEL_ZERO_INCLUDE_DIR}" ) diff --git a/sycl/tools/CMakeLists.txt b/sycl/tools/CMakeLists.txt index 55a18938d3462..67b0c7329a10b 100644 --- a/sycl/tools/CMakeLists.txt +++ b/sycl/tools/CMakeLists.txt @@ -19,7 +19,7 @@ endif() target_link_libraries(get_device_count_by_type PRIVATE OpenCL::Headers - L0Loader::Headers + LevelZeroLoader::Headers ${OpenCL_LIBRARIES} ${LEVEL_ZERO_LIBRARY} $<$:cudadrv> From 2bae1039227981e91f0a6ba8099e662dbd426145 Mon Sep 17 00:00:00 2001 From: Gail Lyons Date: Fri, 17 Jul 2020 17:48:23 -0700 Subject: [PATCH 6/9] Fixed clang-format issues Signed-off-by: Gail Lyons --- sycl/include/CL/sycl/backend/level_zero.hpp | 4 +- sycl/plugins/level_zero/pi_level_zero.cpp | 61 ++++++++++--------- sycl/plugins/level_zero/pi_level_zero.hpp | 21 ++++--- .../program_manager/program_manager.cpp | 4 +- 4 files changed, 47 insertions(+), 43 deletions(-) mode change 100755 => 100644 sycl/plugins/level_zero/pi_level_zero.hpp diff --git a/sycl/include/CL/sycl/backend/level_zero.hpp b/sycl/include/CL/sycl/backend/level_zero.hpp index 2187525bffa33..e1d0814354229 100644 --- a/sycl/include/CL/sycl/backend/level_zero.hpp +++ b/sycl/include/CL/sycl/backend/level_zero.hpp @@ -32,8 +32,8 @@ template <> struct interop { template struct interop> { + access::target::global_buffer, + access::placeholder::false_t>> { using type = char *; }; diff --git a/sycl/plugins/level_zero/pi_level_zero.cpp b/sycl/plugins/level_zero/pi_level_zero.cpp index 76a799d16ad72..91bc27defebe6 100644 --- a/sycl/plugins/level_zero/pi_level_zero.cpp +++ b/sycl/plugins/level_zero/pi_level_zero.cpp @@ -1,10 +1,10 @@ -//===----------- pi_level_zero.cpp - Level Zero Plugin--------------------------==// +//===-------- pi_level_zero.cpp - Level Zero Plugin --------------------==// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // -//===----------------------------------------------------------------------===// +//===------------------------------------------------------------------===// /// \file pi_level_zero.cpp /// Implementation of Level Zero Plugin. @@ -26,8 +26,8 @@ namespace { -// Controls Level Zero calls serialization to w/a Level Zero driver being not MT ready. -// Recognized values (can be used as a bit mask): +// Controls Level Zero calls serialization to w/a Level Zero driver being not MT +// ready. Recognized values (can be used as a bit mask): enum { ZeSerializeNone = 0, // no locking or blocking (except when SYCL RT requested blocking) @@ -754,7 +754,8 @@ pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, // cl_khr_3d_image_writes - Extension to enable writes to 3D image memory // objects. // - // Hardcoding some extensions we know are supported by all Level Zero devices. + // Hardcoding some extensions we know are supported by all Level Zero + // devices. SupportedExtensions += (ZE_SUPPORTED_EXTENSIONS); if (ZeDeviceKernelProperties.fp16Supported) SupportedExtensions += ("cl_khr_fp16 "); @@ -995,24 +996,24 @@ pi_result piDeviceGetInfo(pi_device Device, pi_device_info ParamName, return ReturnValue(pi_uint64{DoubleFPValue}); } case PI_DEVICE_INFO_IMAGE2D_MAX_WIDTH: - // Until Level Zero provides needed info, hardcode default minimum values required - // by the SYCL specification. + // Until Level Zero provides needed info, hardcode default minimum values + // required by the SYCL specification. return ReturnValue(size_t{8192}); case PI_DEVICE_INFO_IMAGE2D_MAX_HEIGHT: - // Until Level Zero provides needed info, hardcode default minimum values required - // by the SYCL specification. + // Until Level Zero provides needed info, hardcode default minimum values + // required by the SYCL specification. return ReturnValue(size_t{8192}); case PI_DEVICE_INFO_IMAGE3D_MAX_WIDTH: - // Until Level Zero provides needed info, hardcode default minimum values required - // by the SYCL specification. + // Until Level Zero provides needed info, hardcode default minimum values + // required by the SYCL specification. return ReturnValue(size_t{2048}); case PI_DEVICE_INFO_IMAGE3D_MAX_HEIGHT: - // Until Level Zero provides needed info, hardcode default minimum values required - // by the SYCL specification. + // Until Level Zero provides needed info, hardcode default minimum values + // required by the SYCL specification. return ReturnValue(size_t{2048}); case PI_DEVICE_INFO_IMAGE3D_MAX_DEPTH: - // Until Level Zero provides needed info, hardcode default minimum values required - // by the SYCL specification. + // Until Level Zero provides needed info, hardcode default minimum values + // required by the SYCL specification. return ReturnValue(size_t{2048}); case PI_DEVICE_INFO_IMAGE_MAX_BUFFER_SIZE: return ReturnValue(size_t{ZeDeviceImageProperties.maxImageBufferSize}); @@ -1437,9 +1438,9 @@ pi_result piMemBufferCreate(pi_context Context, pi_mem_flags Flags, size_t Size, auto HostPtrOrNull = (Flags & PI_MEM_FLAGS_HOST_PTR_USE) ? pi_cast(HostPtr) : nullptr; try { - *RetMem = new _pi_buffer(Context->Device->Platform, - pi_cast(Ptr) /* Level Zero Memory Handle */, - HostPtrOrNull); + *RetMem = new _pi_buffer( + Context->Device->Platform, + pi_cast(Ptr) /* Level Zero Memory Handle */, HostPtrOrNull); } catch (const std::bad_alloc &) { return PI_OUT_OF_HOST_MEMORY; } catch (...) { @@ -1660,8 +1661,8 @@ pi_result piProgramCreate(pi_context Context, const void *IL, size_t Length, assert(Context); assert(Program); - // NOTE: the Level Zero module creation is also building the program, so we are - // deferring it until the program is ready to be built in piProgramBuild + // NOTE: the Level Zero module creation is also building the program, so we + // are deferring it until the program is ready to be built in piProgramBuild // and piProgramCompile. Also it is only then we know the build options. // ze_module_desc_t ZeModuleDesc = {}; @@ -1796,7 +1797,8 @@ pi_result piProgramLink(pi_context Context, pi_uint32 NumDevices, void (*PFnNotify)(pi_program Program, void *UserData), void *UserData, pi_program *RetProgram) { - // TODO: Level Zero does not [yet] support linking so dummy implementation here. + // TODO: Level Zero does not [yet] support linking so dummy implementation + // here. assert(NumInputPrograms == 1 && InputPrograms); assert(RetProgram); *RetProgram = InputPrograms[0]; @@ -2052,9 +2054,9 @@ pi_result piKernelGetInfo(pi_kernel Kernel, pi_kernel_info ParamName, case PI_KERNEL_INFO_PROGRAM: return ReturnValue(pi_program{Kernel->Program}); case PI_KERNEL_INFO_FUNCTION_NAME: - // TODO: Replace with the line in the comment once bug in the Level Zero driver will - // be fixed. Problem is that currently Level Zero driver truncates name of the - // returned kernel if it is longer than 256 symbols. + // TODO: Replace with the line in the comment once bug in the Level Zero + // driver will be fixed. Problem is that currently Level Zero driver + // truncates name of the returned kernel if it is longer than 256 symbols. // // return ReturnValue(ZeKernelProperties.name); return ReturnValue(Kernel->KernelName.c_str()); @@ -3010,8 +3012,8 @@ piEnqueueMemBufferMap(pi_queue Queue, pi_mem Buffer, pi_bool BlockingMap, ZE_CALL(zeCommandListAppendWaitOnEvents(ZeCommandList, NumEventsInWaitList, ZeEventWaitList)); - // TODO: Level Zero is missing the memory "mapping" capabilities, so we are left - // to doing new memory allocation and a copy (read). + // TODO: Level Zero is missing the memory "mapping" capabilities, so we are + // left to doing new memory allocation and a copy (read). // // TODO: check if the input buffer is already allocated in shared // memory and thus is accessible from the host as is. Can we get SYCL RT @@ -3081,8 +3083,8 @@ pi_result piEnqueueMemUnmap(pi_queue Queue, pi_mem MemObj, void *MappedPtr, ZE_CALL(zeCommandListAppendWaitOnEvents(ZeCommandList, NumEventsInWaitList, ZeEventWaitList)); - // TODO: Level Zero is missing the memory "mapping" capabilities, so we are left - // to doing copy (write back to the device). + // TODO: Level Zero is missing the memory "mapping" capabilities, so we are + // left to doing copy (write back to the device). // // NOTE: Keep this in sync with the implementation of // piEnqueueMemBufferMap/piEnqueueMemImageMap. @@ -3754,7 +3756,8 @@ pi_result piextProgramSetSpecializationConstant(pi_program Prog, // Pass SpecValue pointer. Spec constant value is retrieved // by Level-Zero when creating the modul // - // NOTE: SpecSize is unused in Level Zero, the size is known from SPIR-V by SpecID. + // NOTE: SpecSize is unused in Level Zero, the size is known from SPIR-V by + // SpecID. Prog->ZeSpecConstants[SpecID] = reinterpret_cast(SpecValue); return PI_SUCCESS; diff --git a/sycl/plugins/level_zero/pi_level_zero.hpp b/sycl/plugins/level_zero/pi_level_zero.hpp old mode 100755 new mode 100644 index 7f69f15abcb0b..a3db143a55a48 --- a/sycl/plugins/level_zero/pi_level_zero.hpp +++ b/sycl/plugins/level_zero/pi_level_zero.hpp @@ -1,10 +1,10 @@ -//===---------- pi_level_zero.hpp - Level Zero Plugin -------------------------===// +//===------- pi_level_zero.hpp - Level Zero Plugin -------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // -//===----------------------------------------------------------------------===// +//===-----------------------------------------------------------------===// /// \defgroup sycl_pi_level_zero Level Zero Plugin /// \ingroup sycl_pi @@ -56,13 +56,14 @@ struct _pi_object { std::atomic RefCount; }; -// Define the types that are opaque in pi.h in a manner suitabale for Level Zero plugin +// Define the types that are opaque in pi.h in a manner suitabale for Level Zero +// plugin struct _pi_platform { _pi_platform(ze_driver_handle_t Driver) : ZeDriver{Driver} {} - // Level Zero lacks the notion of a platform, but there is a driver, which is a - // pretty good fit to keep here. + // Level Zero lacks the notion of a platform, but there is a driver, which is + // a pretty good fit to keep here. ze_driver_handle_t ZeDriver; // Cache versions info from zeDriverGetProperties. @@ -89,8 +90,8 @@ struct _pi_device : _pi_object { // PI platform to which this device belongs. pi_platform Platform; - // Immediate Level Zero command list for this device, to be used for initializations. - // To be created as: + // Immediate Level Zero command list for this device, to be used for + // initializations. To be created as: // - Immediate command list: So any command appended to it is immediately // offloaded to the device. // - Synchronous: So implicit synchronization is made inside the level-zero @@ -283,9 +284,9 @@ struct _pi_event : _pi_object { // Level Zero event pool handle. ze_event_pool_handle_t ZeEventPool; - // Level Zero command list where the command signaling this event was appended to. - // This is currently used to remember/destroy the command list after - // all commands in it are completed, i.e. this event signaled. + // Level Zero command list where the command signaling this event was appended + // to. This is currently used to remember/destroy the command list after all + // commands in it are completed, i.e. this event signaled. ze_command_list_handle_t ZeCommandList; // Keeps the command-queue and command associated with the event. diff --git a/sycl/source/detail/program_manager/program_manager.cpp b/sycl/source/detail/program_manager/program_manager.cpp index cd2bd291ac51d..f223047bda2bb 100644 --- a/sycl/source/detail/program_manager/program_manager.cpp +++ b/sycl/source/detail/program_manager/program_manager.cpp @@ -783,8 +783,8 @@ ProgramManager::build(ProgramPtr Program, const ContextImplPtr Context, LinkOpts = LinkOptions.c_str(); } - // Level-Zero plugin doesn't support piProgramCompile/piProgramLink commands, program - // is built during piProgramCreate. + // Level-Zero plugin doesn't support piProgramCompile/piProgramLink commands, + // program is built during piProgramCreate. // TODO: remove this check as soon as piProgramCompile/piProgramLink will be // implemented in Level-Zero plugin. if (Context->getPlugin().getBackend() == backend::level_zero) { From bc2b9ef3ebb5f806de843dde31209c922216a2d2 Mon Sep 17 00:00:00 2001 From: Gail Lyons Date: Wed, 22 Jul 2020 12:01:23 -0700 Subject: [PATCH 7/9] Updated test files; bumped ABI version number Signed-off-by: Gail Lyons --- sycl/CMakeLists.txt | 2 +- sycl/ReleaseNotes.md | 2 +- sycl/test/abi/pi_level_zero_symbol_check.dump | 2 +- sycl/test/abi/sycl_symbols_linux.dump | 16 ++++++---------- .../test/basic_tests/buffer/buffer_full_copy.cpp | 2 +- .../spec_const/spec_const_hw_accelerator.cpp | 2 +- .../spec_const_redefine_accelerator.cpp | 2 +- 7 files changed, 12 insertions(+), 16 deletions(-) diff --git a/sycl/CMakeLists.txt b/sycl/CMakeLists.txt index f635aa35fcad3..15f3b307b6f22 100644 --- a/sycl/CMakeLists.txt +++ b/sycl/CMakeLists.txt @@ -14,7 +14,7 @@ include(AddSYCLExecutable) set(SYCL_MAJOR_VERSION 2) set(SYCL_MINOR_VERSION 1) set(SYCL_PATCH_VERSION 0) -set(SYCL_DEV_ABI_VERSION 1) +set(SYCL_DEV_ABI_VERSION 2) if (SYCL_ADD_DEV_VERSION_POSTFIX) set(SYCL_VERSION_POSTFIX "-${SYCL_DEV_ABI_VERSION}") endif() diff --git a/sycl/ReleaseNotes.md b/sycl/ReleaseNotes.md index 70d30cf3cfd5b..7c6963777fb30 100644 --- a/sycl/ReleaseNotes.md +++ b/sycl/ReleaseNotes.md @@ -62,7 +62,7 @@ Release notes for the commit range ba404be..24726df - Added a cache for PI plugins, so subsequent calls for `sycl::device` creation should be cheaper [03dd60d] - A SYCL program will be aborted now if program linking is requested when - using L0 plugin. This is done because L0 doesn't support program linking + using Level Zero plugin. This is done because L0 doesn't support program linking [d4a5b71] - Added a diagnostic on attempt to use `sycl::program::set_spec_constant` when the program is already in compiled or linked state [e2e3d3d] diff --git a/sycl/test/abi/pi_level_zero_symbol_check.dump b/sycl/test/abi/pi_level_zero_symbol_check.dump index f6bb19aa16a5b..7c8c74b8cc77d 100644 --- a/sycl/test/abi/pi_level_zero_symbol_check.dump +++ b/sycl/test/abi/pi_level_zero_symbol_check.dump @@ -3,7 +3,7 @@ # DO NOT EDIT IT MANUALLY. Refer to sycl/docs/ABIPolicyGuide.md for more info. ################################################################################ -# RUN: env LLVM_BIN_PATH=%llvm_build_bin_dir python %sycl_tools_src_dir/abi_check.py --mode check_symbols --reference %s %sycl_libs_dir/libpi_level0.so +# RUN: env LLVM_BIN_PATH=%llvm_build_bin_dir python %sycl_tools_src_dir/abi_check.py --mode check_symbols --reference %s %sycl_libs_dir/libpi_level_zero.so # REQUIRES: linux piContextCreate diff --git a/sycl/test/abi/sycl_symbols_linux.dump b/sycl/test/abi/sycl_symbols_linux.dump index 724b75de2e18c..0b336464462d3 100644 --- a/sycl/test/abi/sycl_symbols_linux.dump +++ b/sycl/test/abi/sycl_symbols_linux.dump @@ -3625,8 +3625,8 @@ _ZN2cl4sycl5eventC1Ev _ZN2cl4sycl5eventC2EP9_cl_eventRKNS0_7contextE _ZN2cl4sycl5eventC2ESt10shared_ptrINS0_6detail10event_implEE _ZN2cl4sycl5eventC2Ev -_ZN2cl4sycl5intel6detail17reduComputeWGSizeEmmRm _ZN2cl4sycl5intel6detail16reduGetMaxWGSizeESt10shared_ptrINS0_6detail10queue_implEEm +_ZN2cl4sycl5intel6detail17reduComputeWGSizeEmmRm _ZN2cl4sycl5queue10mem_adviseEPKvm14_pi_mem_advice _ZN2cl4sycl5queue10wait_proxyERKNS0_6detail13code_locationE _ZN2cl4sycl5queue11submit_implESt8functionIFvRNS0_7handlerEEERKNS0_6detail13code_locationE @@ -3732,15 +3732,15 @@ _ZN2cl4sycl6detail12sampler_implD2Ev _ZN2cl4sycl6detail12split_stringERKNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEEc _ZN2cl4sycl6detail13MemoryManager12prefetch_usmEPvSt10shared_ptrINS1_10queue_implEEmSt6vectorIP9_pi_eventSaIS9_EERS9_ _ZN2cl4sycl6detail13MemoryManager13releaseMemObjESt10shared_ptrINS1_12context_implEEPNS1_11SYCLMemObjIEPvS8_ -_ZN2cl4sycl6detail13MemoryManager19allocateImageObjectESt10shared_ptrINS1_12context_implEEPvbRK14_pi_image_descRK16_pi_image_formatRKNS0_13property_listE _ZN2cl4sycl6detail13MemoryManager16allocateMemImageESt10shared_ptrINS1_12context_implEEPNS1_11SYCLMemObjIEPvbmRK14_pi_image_descRK16_pi_image_formatRKS3_INS1_10event_implEERKS5_RKNS0_13property_listERP9_pi_event -_ZN2cl4sycl6detail13MemoryManager24allocateInteropMemObjectESt10shared_ptrINS1_12context_implEEPvRKS3_INS1_10event_implEERKS5_RKNS0_13property_listERP9_pi_event -_ZN2cl4sycl6detail13MemoryManager20allocateBufferObjectESt10shared_ptrINS1_12context_implEEPvbmRKNS0_13property_listE +_ZN2cl4sycl6detail13MemoryManager17allocateMemBufferESt10shared_ptrINS1_12context_implEEPNS1_11SYCLMemObjIEPvbmRKS3_INS1_10event_implEERKS5_RKNS0_13property_listERP9_pi_event _ZN2cl4sycl6detail13MemoryManager18allocateHostMemoryEPNS1_11SYCLMemObjIEPvbmRKNS0_13property_listE -_ZN2cl4sycl6detail13MemoryManager19wrapIntoImageBufferESt10shared_ptrINS1_12context_implEEPvPNS1_11SYCLMemObjIE _ZN2cl4sycl6detail13MemoryManager18releaseImageBufferESt10shared_ptrINS1_12context_implEEPv -_ZN2cl4sycl6detail13MemoryManager17allocateMemBufferESt10shared_ptrINS1_12context_implEEPNS1_11SYCLMemObjIEPvbmRKS3_INS1_10event_implEERKS5_RKNS0_13property_listERP9_pi_event +_ZN2cl4sycl6detail13MemoryManager19allocateImageObjectESt10shared_ptrINS1_12context_implEEPvbRK14_pi_image_descRK16_pi_image_formatRKNS0_13property_listE +_ZN2cl4sycl6detail13MemoryManager19wrapIntoImageBufferESt10shared_ptrINS1_12context_implEEPvPNS1_11SYCLMemObjIE +_ZN2cl4sycl6detail13MemoryManager20allocateBufferObjectESt10shared_ptrINS1_12context_implEEPvbmRKNS0_13property_listE _ZN2cl4sycl6detail13MemoryManager20allocateMemSubBufferESt10shared_ptrINS1_12context_implEEPvmmNS0_5rangeILi3EEESt6vectorIS3_INS1_10event_implEESaISB_EERP9_pi_event +_ZN2cl4sycl6detail13MemoryManager24allocateInteropMemObjectESt10shared_ptrINS1_12context_implEEPvRKS3_INS1_10event_implEERKS5_RKNS0_13property_listERP9_pi_event _ZN2cl4sycl6detail13MemoryManager3mapEPNS1_11SYCLMemObjIEPvSt10shared_ptrINS1_10queue_implEENS0_6access4modeEjNS0_5rangeILi3EEESC_NS0_2idILi3EEEjSt6vectorIP9_pi_eventSaISH_EERSH_ _ZN2cl4sycl6detail13MemoryManager4copyEPNS1_11SYCLMemObjIEPvSt10shared_ptrINS1_10queue_implEEjNS0_5rangeILi3EEESA_NS0_2idILi3EEEjS5_S8_jSA_SA_SC_jSt6vectorIP9_pi_eventSaISF_EERSF_ _ZN2cl4sycl6detail13MemoryManager4fillEPNS1_11SYCLMemObjIEPvSt10shared_ptrINS1_10queue_implEEmPKcjNS0_5rangeILi3EEESC_NS0_2idILi3EEEjSt6vectorIP9_pi_eventSaISH_EERSH_ @@ -3795,10 +3795,6 @@ _ZN2cl4sycl6kernelC1EP10_cl_kernelRKNS0_7contextE _ZN2cl4sycl6kernelC1ESt10shared_ptrINS0_6detail11kernel_implEE _ZN2cl4sycl6kernelC2EP10_cl_kernelRKNS0_7contextE _ZN2cl4sycl6kernelC2ESt10shared_ptrINS0_6detail11kernel_implEE -_ZN2cl4sycl6level010make_queueERKNS0_7contextEm -_ZN2cl4sycl6level011make_deviceERKNS0_8platformEm -_ZN2cl4sycl6level012make_programERKNS0_7contextEm -_ZN2cl4sycl6level013make_platformEm _ZN2cl4sycl6mallocEmRKNS0_5queueENS0_3usm5allocE _ZN2cl4sycl6mallocEmRKNS0_6deviceERKNS0_7contextENS0_3usm5allocE _ZN2cl4sycl6opencl10make_queueERKNS0_7contextEm diff --git a/sycl/test/basic_tests/buffer/buffer_full_copy.cpp b/sycl/test/basic_tests/buffer/buffer_full_copy.cpp index 79e69067682d5..2743557f6f971 100644 --- a/sycl/test/basic_tests/buffer/buffer_full_copy.cpp +++ b/sycl/test/basic_tests/buffer/buffer_full_copy.cpp @@ -6,7 +6,7 @@ // RUN: %GPU_RUN_PLACEHOLDER %t2.out // RUN: %ACC_RUN_PLACEHOLDER %t2.out -// XFAIL: level0 +// XFAIL: level_zero //==------------- buffer_full_copy.cpp - SYCL buffer basic test ------------==// // diff --git a/sycl/test/spec_const/spec_const_hw_accelerator.cpp b/sycl/test/spec_const/spec_const_hw_accelerator.cpp index d4eb754065c18..bd7df40ed378a 100644 --- a/sycl/test/spec_const/spec_const_hw_accelerator.cpp +++ b/sycl/test/spec_const/spec_const_hw_accelerator.cpp @@ -12,6 +12,6 @@ // TODO: re-enable after CI drivers are updated to newer which support spec // constants: // XFAIL: linux && opencl && accelerator -// UNSUPPORTED: cuda || level0 +// UNSUPPORTED: cuda || level_zero #include "spec_const_hw.cpp" // RUN: %ACC_RUN_PLACEHOLDER %t.out diff --git a/sycl/test/spec_const/spec_const_redefine_accelerator.cpp b/sycl/test/spec_const/spec_const_redefine_accelerator.cpp index 00ef10f63fdfa..52293f7a953e7 100644 --- a/sycl/test/spec_const/spec_const_redefine_accelerator.cpp +++ b/sycl/test/spec_const/spec_const_redefine_accelerator.cpp @@ -14,6 +14,6 @@ // TODO: re-enable after CI drivers are updated to newer which support spec // constants: // XFAIL: linux && opencl && accelerator -// UNSUPPORTED: cuda || level0 +// UNSUPPORTED: cuda || level_zero #include "spec_const_redefine_accelerator.cpp" // RUN: env SYCL_PI_TRACE=2 %ACC_RUN_PLACEHOLDER %t.out 2>&1 %ACC_CHECK_PLACEHOLDER From 2ab1e0957a73109107dfde4da38fbab66ba3b147 Mon Sep 17 00:00:00 2001 From: Gail Lyons Date: Fri, 24 Jul 2020 12:25:29 -0700 Subject: [PATCH 8/9] Resolved clang-format issue. Signed-off-by: Gail Lyons --- sycl/include/CL/sycl/backend/level_zero.hpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/sycl/include/CL/sycl/backend/level_zero.hpp b/sycl/include/CL/sycl/backend/level_zero.hpp index 9ddfbf70fe4c7..82de4eb4c6a78 100644 --- a/sycl/include/CL/sycl/backend/level_zero.hpp +++ b/sycl/include/CL/sycl/backend/level_zero.hpp @@ -39,8 +39,8 @@ struct interop struct interop> { + access::target::constant_buffer, + access::placeholder::false_t>> { using type = char *; }; From c8479d339cf33fe3825e5064bb3436836f6442f0 Mon Sep 17 00:00:00 2001 From: Gail Lyons Date: Tue, 28 Jul 2020 08:49:04 -0700 Subject: [PATCH 9/9] Updated SYCL ABI version number. Addressed other code review comments. Signed-off-by: Gail Lyons --- sycl/CMakeLists.txt | 2 +- sycl/source/detail/config.hpp | 2 +- sycl/test/basic_tests/image_accessor_readsampler.cpp | 1 - sycl/test/spec_const/spec_const_hw.cpp | 1 - sycl/test/spec_const/spec_const_redefine.cpp | 1 - 5 files changed, 2 insertions(+), 5 deletions(-) diff --git a/sycl/CMakeLists.txt b/sycl/CMakeLists.txt index fa32502e0145d..1b7ae47f7b7fb 100644 --- a/sycl/CMakeLists.txt +++ b/sycl/CMakeLists.txt @@ -14,7 +14,7 @@ include(AddSYCLExecutable) set(SYCL_MAJOR_VERSION 2) set(SYCL_MINOR_VERSION 1) set(SYCL_PATCH_VERSION 0) -set(SYCL_DEV_ABI_VERSION 3) +set(SYCL_DEV_ABI_VERSION 4) if (SYCL_ADD_DEV_VERSION_POSTFIX) set(SYCL_VERSION_POSTFIX "-${SYCL_DEV_ABI_VERSION}") endif() diff --git a/sycl/source/detail/config.hpp b/sycl/source/detail/config.hpp index 948c91849fc68..ac6fe8fbcbd2b 100644 --- a/sycl/source/detail/config.hpp +++ b/sycl/source/detail/config.hpp @@ -15,7 +15,7 @@ #include #include #include -#include +#include #include __SYCL_INLINE_NAMESPACE(cl) { diff --git a/sycl/test/basic_tests/image_accessor_readsampler.cpp b/sycl/test/basic_tests/image_accessor_readsampler.cpp index 078a18fd61f1b..a15e55f2087cd 100644 --- a/sycl/test/basic_tests/image_accessor_readsampler.cpp +++ b/sycl/test/basic_tests/image_accessor_readsampler.cpp @@ -6,7 +6,6 @@ // RUN: %CPU_RUN_PLACEHOLDER %t.out // RUN: %GPU_RUN_PLACEHOLDER %t.out // - //==------------------- image_accessor_readsampler.cpp ---------------------==// //==-----------------image_accessor read API test with sampler--------------==// // diff --git a/sycl/test/spec_const/spec_const_hw.cpp b/sycl/test/spec_const/spec_const_hw.cpp index 0cd68617cf32f..442121353bb73 100644 --- a/sycl/test/spec_const/spec_const_hw.cpp +++ b/sycl/test/spec_const/spec_const_hw.cpp @@ -4,7 +4,6 @@ // RUN: env SYCL_DEVICE_TYPE=HOST %t.out // RUN: %CPU_RUN_PLACEHOLDER %t.out // RUN: %GPU_RUN_PLACEHOLDER %t.out - // //==----------- spec_const_hw.cpp ------------------------------------------==// // diff --git a/sycl/test/spec_const/spec_const_redefine.cpp b/sycl/test/spec_const/spec_const_redefine.cpp index 751db0ee70d26..6883ce5c9d7d6 100644 --- a/sycl/test/spec_const/spec_const_redefine.cpp +++ b/sycl/test/spec_const/spec_const_redefine.cpp @@ -4,7 +4,6 @@ // RUN: env SYCL_DEVICE_TYPE=HOST %t.out // RUN: env SYCL_PI_TRACE=2 %CPU_RUN_PLACEHOLDER %t.out 2>&1 %CPU_CHECK_PLACEHOLDER // RUN: env SYCL_PI_TRACE=2 %GPU_RUN_PLACEHOLDER %t.out 2>&1 %GPU_CHECK_PLACEHOLDER - // //==----------- spec_const_redefine.cpp ------------------------------------==// //