pytorch
diff --git a/aten/src/ATen/cpu/vec/sve/vec_bfloat16.h b/aten/src/ATen/cpu/vec/sve/vec_bfloat16.h
Lines changed: 3 additions & 0 deletions
diff --git a/aten/src/ATen/cpu/vec/sve/vec_double.h b/aten/src/ATen/cpu/vec/sve/vec_double.h
Lines changed: 3 additions & 0 deletions
diff --git a/aten/src/ATen/cpu/vec/sve/vec_float.h b/aten/src/ATen/cpu/vec/sve/vec_float.h
Lines changed: 3 additions & 0 deletions
diff --git a/aten/src/ATen/cpu/vec/sve/vec_int.h b/aten/src/ATen/cpu/vec/sve/vec_int.h
Lines changed: 3 additions & 0 deletions
diff --git a/aten/src/ATen/cpu/vec/sve/vec_qint.h b/aten/src/ATen/cpu/vec/sve/vec_qint.h
Lines changed: 9 additions & 0 deletions
diff --git a/aten/src/ATen/cpu/vec/vec128/vec128_bfloat16_neon.h b/aten/src/ATen/cpu/vec/vec128/vec128_bfloat16_neon.h
Lines changed: 3 additions & 0 deletions
diff --git a/aten/src/ATen/cpu/vec/vec128/vec128_float_neon.h b/aten/src/ATen/cpu/vec/vec128/vec128_float_neon.h
Lines changed: 3 additions & 0 deletions
diff --git a/aten/src/ATen/cpu/vec/vec128/vec128_half_neon.h b/aten/src/ATen/cpu/vec/vec128/vec128_half_neon.h
Lines changed: 3 additions & 0 deletions
diff --git a/aten/src/ATen/cpu/vec/vec256/vec256_bfloat16.h b/aten/src/ATen/cpu/vec/vec256/vec256_bfloat16.h
Lines changed: 3 additions & 0 deletions
diff --git a/aten/src/ATen/cpu/vec/vec256/vec256_complex_double.h b/aten/src/ATen/cpu/vec/vec256/vec256_complex_double.h
Lines changed: 4 additions & 0 deletions
@@ -20,6 +20,9 @@ inline namespace CPU_CAPABILITY {
 
 #if defined(CPU_CAPABILITY_SVE256) && defined(__ARM_FEATURE_BF16)
 
+template <>
+struct is_vec_specialized_for<BFloat16> : std::bool_constant<true> {};
+
 template <>
 class Vectorized<BFloat16> {
  private:
 
@@ -24,6 +24,9 @@ inline namespace CPU_CAPABILITY {
 
 #if defined(CPU_CAPABILITY_SVE)
 
+template <>
+struct is_vec_specialized_for<double> : std::bool_constant<true> {};
+
 template <>
 class Vectorized<double> {
  private:
 
@@ -24,6 +24,9 @@ inline namespace CPU_CAPABILITY {
 
 #if defined(CPU_CAPABILITY_SVE)
 
+template <>
+struct is_vec_specialized_for<float> : std::bool_constant<true> {};
+
 template <>
 class Vectorized<float> {
  private:
 
@@ -19,6 +19,9 @@ inline namespace CPU_CAPABILITY {
 
 #define VEC_INT_SVE_TEMPLATE(vl, bit)                                         \
   template <>                                                                 \
+  struct is_vec_specialized_for<int##bit##_t> : std::bool_constant<true> {};  \
+                                                                              \
+  template <>                                                                 \
   class Vectorized<int##bit##_t> {                                            \
    private:                                                                   \
     vls_int##bit##_t values;                                                  \
 
@@ -142,6 +142,9 @@ struct VectorizedQuantizedConverter {
   VectorizedQuantizedConverter() {}
 };
 
+template <>
+struct is_vec_specialized_for<c10::qint32> : std::bool_constant<true> {};
+
 template <>
 struct Vectorized<c10::qint32> : public VectorizedQuantizedConverter<
                                      c10::qint32,
@@ -302,6 +305,9 @@ Vectorized<c10::qint32> inline operator+(
   return retval;
 }
 
+template <>
+struct is_vec_specialized_for<c10::qint8> : std::bool_constant<true> {};
+
 template <>
 struct Vectorized<c10::qint8> : public VectorizedQuantizedConverter<
                                     c10::qint8,
@@ -442,6 +448,9 @@ Vectorized<c10::qint8> inline maximum(
   return a.maximum(b);
 }
 
+template <>
+struct is_vec_specialized_for<c10::quint8> : std::bool_constant<true> {};
+
 template <>
 struct Vectorized<c10::quint8> : public VectorizedQuantizedConverter<
                                      c10::quint8,
 
@@ -128,6 +128,9 @@ struct BlendBFloat16Regs<index, false> {
   }
 };
 
+template <>
+struct is_vec_specialized_for<c10::BFloat16> : std::bool_constant<true> {};
+
 template <>
 class Vectorized<c10::BFloat16> : public Vectorized16<
                                       at_bfloat16x8_t,
 
@@ -69,6 +69,9 @@ struct BlendRegs<index, false> {
   }
 };
 
+template <>
+struct is_vec_specialized_for<float> : std::bool_constant<true> {};
+
 template <>
 class Vectorized<float> {
  private:
 
@@ -58,6 +58,9 @@ struct BlendHalfRegs<index, false> {
   }
 };
 
+template <>
+struct is_vec_specialized_for<c10::Half> : std::bool_constant<true> {};
+
 // On ARM, Half type supports float16_t->Half constructor and Half->float16_t
 // conversion
 template <>
 
@@ -12,6 +12,9 @@ inline namespace CPU_CAPABILITY {
 
 #if defined(CPU_CAPABILITY_AVX2)
 
+template <>
+struct is_vec_specialized_for<BFloat16> : std::bool_constant<true> {};
+
 template <>
 class Vectorized<BFloat16> : public Vectorized16<BFloat16> {
  public:
 
@@ -19,6 +19,10 @@ inline namespace CPU_CAPABILITY {
 
 #if defined(CPU_CAPABILITY_AVX2)
 
+template <>
+struct is_vec_specialized_for<c10::complex<double>> : std::bool_constant<true> {
+};
+
 template <>
 class Vectorized<c10::complex<double>> {
  private:
| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
| | | `@@ -128,6 +128,9 @@ struct BlendBFloat16Regs<index, false> {` |
| `128` | `128` | `}` |
| `129` | `129` | `};` |
| `130` | `130` | |
| | `131` | `+template <>` |
| | `132` | `+struct is_vec_specialized_for<c10::BFloat16> : std::bool_constant<true> {};` |
| | `133` | `+` |
| `131` | `134` | `template <>` |
| `132` | `135` | `class Vectorized<c10::BFloat16> : public Vectorized16<` |
| `133` | `136` | `at_bfloat16x8_t,` |
| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
| | | `@@ -69,6 +69,9 @@ struct BlendRegs<index, false> {` |
| `69` | `69` | `}` |
| `70` | `70` | `};` |
| `71` | `71` | |
| | `72` | `+template <>` |
| | `73` | `+struct is_vec_specialized_for<float> : std::bool_constant<true> {};` |
| | `74` | `+` |
| `72` | `75` | `template <>` |
| `73` | `76` | `class Vectorized<float> {` |
| `74` | `77` | `private:` |
| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
| | | `@@ -58,6 +58,9 @@ struct BlendHalfRegs<index, false> {` |
| `58` | `58` | `}` |
| `59` | `59` | `};` |
| `60` | `60` | |
| | `61` | `+template <>` |
| | `62` | `+struct is_vec_specialized_for<c10::Half> : std::bool_constant<true> {};` |
| | `63` | `+` |
| `61` | `64` | `// On ARM, Half type supports float16_t->Half constructor and Half->float16_t` |
| `62` | `65` | `// conversion` |
| `63` | `66` | `template <>` |