update sycl_ext_complex

For some reason, the gtensor-specified AssignN kernel names were missing the second sycl_cplx::complex type argument and failed to compile. Using only the to_kernel types fixes the issue and also makes the names more compact and easier to read. I don't think the E1/E2 template arguments are actually necessary to avoid duplication; the kernel types alone should be unique.
wdmapp · Jan 18, 2023 · 05b0bc2 · 05b0bc2
1 parent 3ecb09a
commit 05b0bc2
Show file tree

Hide file tree

Showing 4 changed files with 346 additions and 707 deletions.
diff --git a/include/gtensor/assign.h b/include/gtensor/assign.h
@@ -401,7 +401,7 @@ struct assigner<1, space::device>
     auto e = q.submit([&](sycl::handler& cgh) {
       using ltype = decltype(k_lhs);
       using rtype = decltype(k_rhs);
-      using kname = gt::backend::sycl::Assign1<E1, E2, ltype, rtype>;
+      using kname = gt::backend::sycl::Assign1<ltype, rtype>;
       cgh.parallel_for<kname>(range, [=](sycl::item<1> item) {
         auto i = item.get_id();
         k_lhs(i) = k_rhs(i);
@@ -427,7 +427,7 @@ struct assigner<2, space::device>
     auto e = q.submit([&](sycl::handler& cgh) {
       using ltype = decltype(k_lhs);
       using rtype = decltype(k_rhs);
-      using kname = gt::backend::sycl::Assign2<E1, E2, ltype, rtype>;
+      using kname = gt::backend::sycl::Assign2<ltype, rtype>;
       cgh.parallel_for<kname>(range, [=](sycl::item<2> item) {
         auto i = item.get_id(1);
         auto j = item.get_id(0);
@@ -454,7 +454,7 @@ struct assigner<3, space::device>
     auto e = q.submit([&](sycl::handler& cgh) {
       using ltype = decltype(k_lhs);
       using rtype = decltype(k_rhs);
-      using kname = gt::backend::sycl::Assign3<E1, E2, ltype, rtype>;
+      using kname = gt::backend::sycl::Assign3<ltype, rtype>;
       cgh.parallel_for<kname>(range, [=](sycl::item<3> item) {
         auto i = item.get_id(2);
         auto j = item.get_id(1);
@@ -493,16 +493,16 @@ struct assigner<N, space::device>
       q.copy(&k_rhs, d_rhs_p, 1).wait();
 
       auto e = q.submit([&](sycl::handler& cgh) {
-        using kname = gt::backend::sycl::AssignN<E1, E2, ltype, rtype>;
-        cgh.parallel_for<kname>(sycl::range<1>(size), [=](sycl::id<1> i) {
+        using kname = gt::backend::sycl::AssignN<ltype, rtype>;
+        cgh.parallel_for(sycl::range<1>(size), [=](sycl::id<1> i) {
           auto idx = unravel(i, strides);
           index_expression(k_lhs, idx) = index_expression(*d_rhs_p, idx);
         });
       });
     } else {
       auto e = q.submit([&](sycl::handler& cgh) {
-        using kname = gt::backend::sycl::AssignN<E1, E2, ltype, rtype>;
-        cgh.parallel_for<kname>(sycl::range<1>(size), [=](sycl::id<1> i) {
+        using kname = gt::backend::sycl::AssignN<ltype, rtype>;
+        cgh.parallel_for(sycl::range<1>(size), [=](sycl::id<1> i) {
           auto idx = unravel(i, strides);
           index_expression(k_lhs, idx) = index_expression(k_rhs, idx);
         });

diff --git a/include/gtensor/backend_sycl.h b/include/gtensor/backend_sycl.h
@@ -24,13 +24,13 @@ namespace sycl
 {
 
 // kernel name templates
-template <typename E1, typename E2, typename K1, typename K2>
+template <typename K1, typename K2>
 class Assign1;
-template <typename E1, typename E2, typename K1, typename K2>
+template <typename K1, typename K2>
 class Assign2;
-template <typename E1, typename E2, typename K1, typename K2>
+template <typename K1, typename K2>
 class Assign3;
-template <typename E1, typename E2, typename K1, typename K2>
+template <typename K1, typename K2>
 class AssignN;
 
 template <typename F>

diff --git a/include/gtensor/complex.h b/include/gtensor/complex.h
@@ -29,7 +29,7 @@ using complex = thrust::complex<T>;
 
 // TODO: this will hopefully be standardized soon and be sycl::complex
 template <typename T>
-using complex = gt::sycl_cplx::complex<T>;
+using complex = gt::sycl_cplx::complex<T, void>;
 
 #else // fallback to std::complex, e.g. for host backend