@@ -713,6 +713,8 @@ pi_result cuda_piContextGetInfo(pi_context context, pi_context_info param_name,
   case PI_CONTEXT_INFO_REFERENCE_COUNT:
     return getInfo(param_value_size, param_value, param_value_size_ret,
                    context->get_reference_count());
+  default:
+    PI_HANDLE_UNKNOWN_PARAM_NAME(param_name);
   }
 
   return PI_OUT_OF_RESOURCES;
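Note: the getInfo helpers these query entry points call implement the usual clGetXxxInfo two-call convention. A minimal sketch of that convention follows; the helper name and error codes are illustrative, not the plugin's actual implementation.

    #include <cstring>

    // Sketch only: copy a fixed-size value out to the caller's buffer and/or
    // report the size it needs (the standard PI/OpenCL two-call idiom).
    template <typename T>
    pi_result getInfoSketch(size_t param_value_size, void *param_value,
                            size_t *param_value_size_ret, T value) {
      if (param_value != nullptr) {
        if (param_value_size < sizeof(T)) // Buffer too small for the result.
          return PI_INVALID_VALUE;        // Illustrative error code.
        std::memcpy(param_value, &value, sizeof(T));
      }
      if (param_value_size_ret != nullptr)
        *param_value_size_ret = sizeof(T); // First call: size query only.
      return PI_SUCCESS;
    }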
@@ -1032,7 +1034,7 @@ pi_result cuda_piDeviceGetInfo(pi_device device, pi_device_info param_name,
   }
   case PI_DEVICE_INFO_LOCAL_MEM_TYPE: {
     return getInfo(param_value_size, param_value, param_value_size_ret,
-                   PI_LOCAL_MEM_TYPE_LOCAL);
+                   PI_DEVICE_LOCAL_MEM_TYPE_LOCAL);
   }
   case PI_DEVICE_INFO_LOCAL_MEM_SIZE: {
     // OpenCL's "local memory" maps most closely to CUDA's "shared memory".
@@ -1073,16 +1075,16 @@ pi_result cuda_piDeviceGetInfo(pi_device device, pi_device_info param_name,
     return getInfo(param_value_size, param_value, param_value_size_ret,
                    size_t{1000u});
   }
-  case PI_DEVICE_INFO_IS_ENDIAN_LITTLE: {
+  case PI_DEVICE_INFO_ENDIAN_LITTLE: {
     return getInfo(param_value_size, param_value, param_value_size_ret, true);
   }
-  case PI_DEVICE_INFO_IS_AVAILABLE: {
+  case PI_DEVICE_INFO_AVAILABLE: {
     return getInfo(param_value_size, param_value, param_value_size_ret, true);
   }
-  case PI_DEVICE_INFO_IS_COMPILER_AVAILABLE: {
+  case PI_DEVICE_INFO_COMPILER_AVAILABLE: {
     return getInfo(param_value_size, param_value, param_value_size_ret, true);
   }
-  case PI_DEVICE_INFO_IS_LINKER_AVAILABLE: {
+  case PI_DEVICE_INFO_LINKER_AVAILABLE: {
     return getInfo(param_value_size, param_value, param_value_size_ret, true);
   }
   case PI_DEVICE_INFO_EXECUTION_CAPABILITIES: {
@@ -1658,8 +1660,8 @@ pi_result cuda_piEnqueueMemBufferWrite(pi_queue command_queue, pi_mem buffer,
                                       event_wait_list, nullptr);
 
     if (event) {
-      retImplEv = std::unique_ptr<_pi_event>(
-          _pi_event::make_native(PI_COMMAND_MEMBUFFER_WRITE, command_queue));
+      retImplEv = std::unique_ptr<_pi_event>(_pi_event::make_native(
+          PI_COMMAND_TYPE_MEM_BUFFER_WRITE, command_queue));
       retImplEv->start();
     }
 
@@ -1703,8 +1705,8 @@ pi_result cuda_piEnqueueMemBufferRead(pi_queue command_queue, pi_mem buffer,
                                       event_wait_list, nullptr);
 
     if (retEvent) {
-      retImplEv = std::unique_ptr<_pi_event>(
-          _pi_event::make_native(PI_COMMAND_MEMBUFFER_READ, command_queue));
+      retImplEv = std::unique_ptr<_pi_event>(_pi_event::make_native(
+          PI_COMMAND_TYPE_MEM_BUFFER_READ, command_queue));
       retImplEv->start();
     }
 
@@ -1943,8 +1945,8 @@ pi_result cuda_piEnqueueKernelLaunch(
     auto argIndices = kernel->get_arg_indices();
 
     if (event) {
-      retImplEv = std::unique_ptr<_pi_event>(
-          _pi_event::make_native(PI_COMMAND_KERNEL_LAUNCH, command_queue));
+      retImplEv = std::unique_ptr<_pi_event>(_pi_event::make_native(
+          PI_COMMAND_TYPE_NDRANGE_KERNEL, command_queue));
       retImplEv->start();
     }
 
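These enqueue hunks all share one event pattern: wrap a native event, start() it before submitting the asynchronous work, then record() it and hand it to the caller. A condensed sketch of that flow, assuming the _pi_event interface shown in this diff; the record/release step follows the copy/fill hunks below, and submitWork stands in for the actual CUDA calls.

    std::unique_ptr<_pi_event> retImplEv{nullptr};
    if (event) { // The caller asked for a completion event.
      retImplEv = std::unique_ptr<_pi_event>(_pi_event::make_native(
          PI_COMMAND_TYPE_NDRANGE_KERNEL, command_queue));
      retImplEv->start(); // Mark the point before submission.
    }
    submitWork();         // Asynchronous work on the queue's CUstream.
    if (event) {
      retImplEv->record();          // Mark the point after submission.
      *event = retImplEv.release(); // Ownership passes to the caller.
    }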
@@ -2247,15 +2249,15 @@ pi_result cuda_piKernelGetGroupInfo(pi_kernel kernel, pi_device device,
   if (kernel != nullptr) {
 
     switch (param_name) {
-    case PI_KERNEL_GROUP_INFO_SIZE: {
+    case PI_KERNEL_GROUP_INFO_WORK_GROUP_SIZE: {
      int max_threads = 0;
      cl::sycl::detail::pi::assertion(cuFuncGetAttribute(&max_threads,
                                          CU_FUNC_ATTRIBUTE_MAX_THREADS_PER_BLOCK,
                                          kernel->get()) == CUDA_SUCCESS);
      return getInfo(param_value_size, param_value, param_value_size_ret,
                     size_t(max_threads));
    }
-    case PI_KERNEL_COMPILE_GROUP_INFO_SIZE: {
+    case PI_KERNEL_GROUP_INFO_COMPILE_WORK_GROUP_SIZE: {
      // Returns the work-group size specified in the kernel source or IL.
      // If the work-group size is not specified in the kernel source or IL,
      // (0, 0, 0) is returned.
@@ -2266,7 +2268,7 @@ pi_result cuda_piKernelGetGroupInfo(pi_kernel kernel, pi_device device,
      return getInfoArray(3, param_value_size, param_value,
                          param_value_size_ret, group_size);
    }
-    case PI_KERNEL_LOCAL_MEM_SIZE: {
+    case PI_KERNEL_GROUP_INFO_LOCAL_MEM_SIZE: {
      // OpenCL LOCAL == CUDA SHARED
      int bytes = 0;
      cl::sycl::detail::pi::assertion(cuFuncGetAttribute(&bytes,
@@ -2275,7 +2277,7 @@ pi_result cuda_piKernelGetGroupInfo(pi_kernel kernel, pi_device device,
      return getInfo(param_value_size, param_value, param_value_size_ret,
                     pi_uint64(bytes));
    }
-    case PI_KERNEL_PREFERRED_WORK_GROUP_SIZE_MULTIPLE: {
+    case PI_KERNEL_GROUP_INFO_PREFERRED_WORK_GROUP_SIZE_MULTIPLE: {
      // Work groups should be multiples of the warp size
      int warpSize = 0;
      cl::sycl::detail::pi::assertion(
@@ -2284,7 +2286,7 @@ pi_result cuda_piKernelGetGroupInfo(pi_kernel kernel, pi_device device,
      return getInfo(param_value_size, param_value, param_value_size_ret,
                     static_cast<size_t>(warpSize));
    }
-    case PI_KERNEL_PRIVATE_MEM_SIZE: {
+    case PI_KERNEL_GROUP_INFO_PRIVATE_MEM_SIZE: {
      // OpenCL PRIVATE == CUDA LOCAL
      int bytes = 0;
      cl::sycl::detail::pi::assertion(
@@ -2373,7 +2375,7 @@ pi_result cuda_piEventGetInfo(pi_event event, pi_event_info param_name,
   assert(event != nullptr);
 
   switch (param_name) {
-  case PI_EVENT_INFO_QUEUE:
+  case PI_EVENT_INFO_COMMAND_QUEUE:
     return getInfo<pi_queue>(param_value_size, param_value,
                              param_value_size_ret, event->get_queue());
   case PI_EVENT_INFO_COMMAND_TYPE:
@@ -2554,7 +2556,7 @@ pi_result cuda_piEnqueueEventsWait(pi_queue command_queue,
 
     if (event) {
       auto new_event =
-          _pi_event::make_native(PI_COMMAND_EVENTS_WAIT, command_queue);
+          _pi_event::make_native(PI_COMMAND_TYPE_MARKER, command_queue);
       new_event->start();
       new_event->record();
       *event = new_event;
@@ -2648,8 +2650,8 @@ pi_result cuda_piEnqueueMemBufferReadRect(
                                       event_wait_list, nullptr);
 
     if (retEvent) {
-      retImplEv = std::unique_ptr<_pi_event>(
-          _pi_event::make_native(PI_COMMAND_MEMBUFFER_READ, command_queue));
+      retImplEv = std::unique_ptr<_pi_event>(_pi_event::make_native(
+          PI_COMMAND_TYPE_MEM_BUFFER_READ, command_queue));
       retImplEv->start();
     }
 
@@ -2699,8 +2701,8 @@ pi_result cuda_piEnqueueMemBufferWriteRect(
                                       event_wait_list, nullptr);
 
     if (retEvent) {
-      retImplEv = std::unique_ptr<_pi_event>(
-          _pi_event::make_native(PI_COMMAND_MEMBUFFER_WRITE, command_queue));
+      retImplEv = std::unique_ptr<_pi_event>(_pi_event::make_native(
+          PI_COMMAND_TYPE_MEM_BUFFER_WRITE, command_queue));
       retImplEv->start();
     }
 
@@ -2754,8 +2756,8 @@ pi_result cuda_piEnqueueMemBufferCopy(pi_queue command_queue, pi_mem src_buffer,
     result = PI_CHECK_ERROR(cuMemcpyDtoDAsync(dst, src, size, stream));
 
     if (event) {
-      auto new_event =
-          _pi_event::make_native(PI_COMMAND_MEMBUFFER_COPY, command_queue);
+      auto new_event = _pi_event::make_native(PI_COMMAND_TYPE_MEM_BUFFER_COPY,
+                                              command_queue);
       new_event->record();
       *event = new_event;
     }
@@ -2792,8 +2794,8 @@ pi_result cuda_piEnqueueMemBufferCopyRect(
                                       event_wait_list, nullptr);
 
     if (event) {
-      retImplEv = std::unique_ptr<_pi_event>(
-          _pi_event::make_native(PI_COMMAND_MEMBUFFER_COPY, command_queue));
+      retImplEv = std::unique_ptr<_pi_event>(_pi_event::make_native(
+          PI_COMMAND_TYPE_MEM_BUFFER_COPY, command_queue));
       retImplEv->start();
     }
 
@@ -2896,8 +2898,8 @@ pi_result cuda_piEnqueueMemBufferFill(pi_queue command_queue, pi_mem buffer,
     }
 
     if (event) {
-      auto new_event =
-          _pi_event::make_native(PI_COMMAND_MEMBUFFER_FILL, command_queue);
+      auto new_event = _pi_event::make_native(PI_COMMAND_TYPE_MEM_BUFFER_FILL,
+                                              command_queue);
       new_event->record();
       *event = new_event;
     }
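For reference, a hypothetical caller-side use of one renamed query, assuming the standard PI query signature and valid kernel/device handles:

    // Two-call convention: here the result size is known, so one call suffices.
    size_t wg_size = 0;
    pi_result err = cuda_piKernelGetGroupInfo(
        kernel, device, PI_KERNEL_GROUP_INFO_WORK_GROUP_SIZE, sizeof(wg_size),
        &wg_size, nullptr);
    // On success, wg_size holds the kernel's max threads per block
    // (CU_FUNC_ATTRIBUTE_MAX_THREADS_PER_BLOCK).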