Feature/reproducible #1446

Open

wants to merge 40 commits into develop

Commits (40)
All 40 commits are authored by maddyscientist.

ccb1c73 (Jul 18, 2023) Fix compiler warning with dbldble
2049be6 (Jul 19, 2023) Add array copy assignment from one type of array to another
81566c8 (Jul 19, 2023) Remove use of zero function and fix caxpyxmazMR functor for when the …
ce5d396 (Jul 19, 2023) Make math_helper.cuh safe to include in non CUDA-aware compiler
7a4e04f (Jul 19, 2023) Add doubledouble support for host, add complex-number support, remove…
2d67d97 (Jul 20, 2023) Modify reduction kernels to use device_reduce_t and not double for in…
feccf89 (Jul 20, 2023) Use same underlying reduction type on host as device
d70303a (Jul 20, 2023) Move get_scalar<deviation_t> overload to float_Vector.h
4a7061a (Jul 20, 2023) Add *= and /= overloads for doubledouble
7e40280 (Jul 20, 2023) Fix heavy quark residual norm for non-double reduction type
2a80b2f (Jul 20, 2023) Add various functions to doubledouble needed for generic deployment
e9089e1 (Jul 20, 2023) Commence the slog that generalizes the host-side scalar precision: intr…
a4e8f76 (Jul 21, 2023) Add isfinite method for doubledouble
a7cc5f7 (Jul 22, 2023) 99% of double -> real_t replacement now done (MPI reductions not yet …
008c632 (Jul 22, 2023) Updated ReduceArg::complete function to work when real_t and device_r…
dc62b01 (Jul 22, 2023) Remove some legacy code
3324b05 (Jul 23, 2023) Fix some issues
a16ff6c (Jul 25, 2023) Add missing cast operator to deviation_t::operator= when copying from…
2b5bac8 (Jul 25, 2023) Add ostream << overload for doubledouble type
9d69abd (Jul 25, 2023) Update CUDA block_reduce_helper.h atomic types to work with doubledou…
7e21a5b (Jul 25, 2023) Add support for doubledouble heterogeneous-atomic reductions. This a…
d5f914d (Jul 25, 2023) transform_reduce now respects device_reduce_t and real_t
1a73132 (Jul 25, 2023) Add initial support for multi-process doubledouble reductions: only Q…
d76e57c (Jul 25, 2023) Multi-process reduction now uses device_reduce_t with the conversion …
27ba8de (Jul 25, 2023) Updates for blas_test: use same basis for host and device to allow fo…
4b5aa52 (Jul 26, 2023) Minor comment clean up
bcde6ad (Jul 28, 2023) Add single gpu support for doubledouble
2ee73a6 (Jul 28, 2023) Small fix for doubledouble::operator>
9789820 (Aug 15, 2023) Initial version of reproducible reductions, fully works but a few lim…
67514d0 (Aug 15, 2023) Merge branch 'feature/gaugefield_unity' of github.com:lattice/quda in…
d455000 (Aug 15, 2023) Fix io_test when not all precisions are compiled
030836d (Aug 15, 2023) Fix compiler warning
08b9776 (Aug 15, 2023) Re-enable explicit zero support with rfa_t (fixes dilution_test)
64ed607 (Aug 15, 2023) Fix gauge loop trace when using doubledouble precision reductions
ba96720 (Aug 15, 2023) Fix doubledouble multi-GPU compilation (missing comm_allreduce_max fu…
b7687b4 (Aug 15, 2023) Fix gauge_path_test loop trace test when using doubledouble reduction…
bc74e7b (Aug 23, 2023) Rework of reproducible reductions to pre-compute the bins when initia… (sketched below)
6a60bc3 (Aug 23, 2023) Minor optimization of det_trace kernel
a8085dc (Aug 23, 2023) Fix compiler warning
a413153 (Aug 23, 2023) Merge branch 'feature/gaugefield_unity' of github.com:lattice/quda in…
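The core of the branch (commits 9789820 and bc74e7b) is the reproducible reduction itself: each value is deposited exactly into a set of pre-computed, fixed-exponent bins, so partial sums combine exactly and the final answer is bit-identical no matter how the work is split across threads, blocks, or ranks. The sketch below illustrates that binned-accumulator idea in self-contained C++; the BinnedSum name, bin layout, and bias are invented here for exposition and are not QUDA's rfa_t.

// Illustrative sketch of order-invariant binned summation (hypothetical,
// not QUDA's rfa_t). Finite inputs assumed; each double is split exactly
// across fixed-width exponent bins held as integers, so deposits are
// associative and any summation order yields identical bin state.
#include <cmath>
#include <cstdint>

struct BinnedSum {
  // 32-bit-wide bins spanning double's exponent range. Each deposit adds
  // less than 2^33 to a bin, so ~2^30 deposits fit in int64 without overflow.
  static constexpr int num_bins = 70;
  static constexpr int bias = 1128; // smallest subnormal lands in bin 0
  std::int64_t bins[num_bins] = {};

  // Deposit x exactly: the 53-bit significand spreads over three bins.
  void add(double x)
  {
    if (x == 0.0) return;
    int e;
    double m = std::frexp(x, &e);                     // x = m * 2^e, 0.5 <= |m| < 1
    std::int64_t q = std::llround(std::ldexp(m, 53)); // exact integer significand
    int B = (e - 53) + bias;                          // biased exponent of the ulp
    int i = B >> 5, s = B & 31;                       // target bin, shift within it
    std::int64_t sign = q < 0 ? -1 : 1, a = sign * q;
    std::int64_t lo = (a & 0xFFFFFFFF) << s;          // low 32 significand bits, shifted
    std::int64_t hi = (a >> 32) << s;                 // high significand bits, shifted
    bins[i]     += sign * (lo & 0xFFFFFFFF);
    bins[i + 1] += sign * (((lo >> 32) & 0xFFFFFFFF) + (hi & 0xFFFFFFFF));
    bins[i + 2] += sign * (hi >> 32);
  }

  // Partial sums combine exactly: bin-wise integer addition.
  void merge(const BinnedSum &other)
  {
    for (int i = 0; i < num_bins; i++) bins[i] += other.bins[i];
  }

  // Fixed-order conversion back to double: rounds, but deterministically.
  double result() const
  {
    double s = 0.0;
    for (int i = num_bins - 1; i >= 0; --i)
      s += std::ldexp(static_cast<double>(bins[i]), 32 * i - bias);
    return s;
  }
};

Because add() deposits each value exactly and merge() is plain integer addition, accumulation is associative and commutative; the only rounding happens in the final fixed-order result() conversion, which is deterministic, hence the reproducibility.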
6 changes: 6 additions & 0 deletions include/array.h
@@ -24,6 +24,12 @@ namespace quda

   array<T, n> &operator=(const array<T, n> &) = default;
   array<T, n> &operator=(array<T, n> &&) = default;
+
+  template <typename U> constexpr array<T, n> &operator=(const array<U, n> &other)
+  {
+    for (int i = 0; i < n; i++) data[i] = other[i];
+    return *this;
+  }
 };
 
 template <typename T, int n> std::ostream &operator<<(std::ostream &output, const array<T, n> &a)
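The converting assignment added above (commit 2049be6) permits element-wise copies between arrays of the same length but different value types, as needed when results move between reduction precisions (e.g. a device_reduce_t array into a real_t array). A hypothetical usage sketch, assuming quda::array's usual operator[]:

// Hypothetical usage of the new converting operator= from include/array.h.
#include "array.h" // quda::array<T, n>

void convert_example()
{
  quda::array<float, 4> src;
  for (int i = 0; i < 4; i++) src[i] = i + 1.0f;

  quda::array<double, 4> dst;
  dst = src; // element-wise conversion, float -> double, via data[i] = other[i]
}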
42 changes: 0 additions & 42 deletions include/blas_helper.cuh
@@ -23,48 +23,6 @@ namespace quda
 static constexpr bool V = V_;
 };
 
-__host__ __device__ inline double set(double &x) { return x; }
-__host__ __device__ inline double2 set(double2 &x) { return x; }
-__host__ __device__ inline double3 set(double3 &x) { return x; }
-__host__ __device__ inline double4 set(double4 &x) { return x; }
-__host__ __device__ inline void sum(double &a, double &b) { a += b; }
-__host__ __device__ inline void sum(double2 &a, double2 &b)
-{
-  a.x += b.x;
-  a.y += b.y;
-}
-__host__ __device__ inline void sum(double3 &a, double3 &b)
-{
-  a.x += b.x;
-  a.y += b.y;
-  a.z += b.z;
-}
-__host__ __device__ inline void sum(double4 &a, double4 &b)
-{
-  a.x += b.x;
-  a.y += b.y;
-  a.z += b.z;
-  a.w += b.w;
-}
-
-#ifdef QUAD_SUM
-__host__ __device__ inline double set(doubledouble &a) { return a.head(); }
-__host__ __device__ inline double2 set(doubledouble2 &a) { return make_double2(a.x.head(), a.y.head()); }
-__host__ __device__ inline double3 set(doubledouble3 &a) { return make_double3(a.x.head(), a.y.head(), a.z.head()); }
-__host__ __device__ inline void sum(double &a, doubledouble &b) { a += b.head(); }
-__host__ __device__ inline void sum(double2 &a, doubledouble2 &b)
-{
-  a.x += b.x.head();
-  a.y += b.y.head();
-}
-__host__ __device__ inline void sum(double3 &a, doubledouble3 &b)
-{
-  a.x += b.x.head();
-  a.y += b.y.head();
-  a.z += b.z.head();
-}
-#endif
-
 // Vector types used for AoS load-store on CPU
 template <> struct VectorType<double, 24> {
   using type = array<double, 24>;
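For context, the doubledouble type whose head() these deleted helpers truncated stores a value as an unevaluated pair head + tail, giving roughly 106 significand bits. Below is a minimal sketch of the standard building blocks (Knuth's two-sum plus a renormalizing add, as in the qd library); it is illustrative only, not QUDA's implementation, and it assumes the compiler does not reassociate or contract these expressions (i.e. no -ffast-math).

// Illustrative double-double arithmetic sketch (not QUDA's doubledouble).
struct dd {
  double head, tail; // value = head + tail, with |tail| <= 0.5 * ulp(head)
};

// Knuth two-sum: a + b = s + err exactly, no assumption on |a| vs |b|.
inline dd two_sum(double a, double b)
{
  double s = a + b;
  double bb = s - a;                     // part of b absorbed into s
  return {s, (a - (s - bb)) + (b - bb)}; // exact rounding error of a + b
}

// Fast two-sum: same result, but requires |a| >= |b|.
inline dd quick_two_sum(double a, double b)
{
  double s = a + b;
  return {s, b - (s - a)};
}

// Double-double addition: two doubles carry ~106 significand bits, which is
// why accumulating a reduction this way loses far less than plain double.
inline dd add(const dd &x, const dd &y)
{
  dd s = two_sum(x.head, y.head);
  return quick_two_sum(s.head, s.tail + x.tail + y.tail);
}

With the reduction pipeline now carried end-to-end in device_reduce_t, the double-truncating set()/sum() overloads have no remaining callers, which is consistent with this hunk being pure deletion (0 additions, 42 deletions).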