rust-lang
diff --git a/‎coresimd/ppsv/api/arithmetic_reductions.rs
Lines changed: 49 additions & 2 deletions b/‎coresimd/ppsv/api/arithmetic_reductions.rs
Lines changed: 49 additions & 2 deletions
diff --git a/‎coresimd/ppsv/api/bitwise_reductions.rs
Lines changed: 104 additions & 7 deletions b/‎coresimd/ppsv/api/bitwise_reductions.rs
Lines changed: 104 additions & 7 deletions
diff --git a/‎coresimd/ppsv/api/boolean_reductions.rs
Lines changed: 25 additions & 1 deletion b/‎coresimd/ppsv/api/boolean_reductions.rs
Lines changed: 25 additions & 1 deletion
diff --git a/‎coresimd/ppsv/api/minmax_reductions.rs
Lines changed: 47 additions & 2 deletions b/‎coresimd/ppsv/api/minmax_reductions.rs
Lines changed: 47 additions & 2 deletions
diff --git a/‎coresimd/ppsv/api/mod.rs
Lines changed: 1 addition & 1 deletion b/‎coresimd/ppsv/api/mod.rs
Lines changed: 1 addition & 1 deletion
@@ -5,14 +5,61 @@ macro_rules! impl_arithmetic_reductions {
     ($id:ident, $elem_ty:ident) => {
         impl $id {
             /// Lane-wise addition of the vector elements.
+            ///
+            /// FIXME: document guarantees with respect to:
+            ///    * integers: overflow behavior
+            ///    * floats: order and NaNs
+            #[cfg(not(target_arch = "aarch64"))]
             #[inline]
             pub fn sum(self) -> $elem_ty {
-                super::codegen::sum::ReduceAdd::reduce_add(self)
+                use ::coresimd::simd_llvm::simd_reduce_add_ordered;
+                unsafe {
+                    simd_reduce_add_ordered(self, 0 as $elem_ty)
+                }
             }
+            /// Lane-wise addition of the vector elements.
+            ///
+            /// FIXME: document guarantees with respect to:
+            ///    * integers: overflow behavior
+            ///    * floats: order and NaNs
+            #[cfg(target_arch = "aarch64")]
+            #[inline]
+            pub fn sum(self) -> $elem_ty {
+                // FIXME: `simd_reduce_add_ordered` is broken on AArch64
+                let mut x = self.extract(0) as $elem_ty;
+                for i in 1..$id::lanes() {
+                    x += self.extract(i) as $elem_ty;
+                }
+                x
+            }
+
             /// Lane-wise multiplication of the vector elements.
+            ///
+            /// FIXME: document guarantees with respect to:
+            ///    * integers: overflow behavior
+            ///    * floats: order and NaNs
+            #[cfg(not(target_arch = "aarch64"))]
             #[inline]
             pub fn product(self) -> $elem_ty {
-                super::codegen::product::ReduceMul::reduce_mul(self)
+                use ::coresimd::simd_llvm::simd_reduce_mul_ordered;
+                unsafe {
+                    simd_reduce_mul_ordered(self, 1 as $elem_ty)
+                }
+            }
+            /// Lane-wise multiplication of the vector elements.
+            ///
+            /// FIXME: document guarantees with respect to:
+            ///    * integers: overflow behavior
+            ///    * floats: order and NaNs
+            #[cfg(target_arch = "aarch64")]
+            #[inline]
+            pub fn product(self) -> $elem_ty {
+                // FIXME: `simd_reduce_mul_ordered` is broken on AArch64
+                let mut x = self.extract(0) as $elem_ty;
+                for i in 1..$id::lanes() {
+                    x *= self.extract(i) as $elem_ty;
+                }
+                x
             }
         }
     }
 
@@ -5,41 +5,138 @@ macro_rules! impl_bitwise_reductions {
     ($id:ident, $elem_ty:ident) => {
         impl $id {
             /// Lane-wise bitwise `and` of the vector elements.
+            #[cfg(not(target_arch = "aarch64"))]
             #[inline]
             pub fn and(self) -> $elem_ty {
-                super::codegen::and::ReduceAnd::reduce_and(self)
+                use ::coresimd::simd_llvm::simd_reduce_and;
+                unsafe {
+                    simd_reduce_and(self)
+                }
             }
+            /// Lane-wise bitwise `and` of the vector elements.
+            #[cfg(target_arch = "aarch64")]
+            #[inline]
+            pub fn and(self) -> $elem_ty {
+                // FIXME: `simd_reduce_and` is broken on AArch64
+                let mut x = self.extract(0) as $elem_ty;
+                for i in 1..$id::lanes() {
+                    x &= self.extract(i) as $elem_ty;
+                }
+                x
+            }
+
             /// Lane-wise bitwise `or` of the vector elements.
+            #[cfg(not(target_arch = "aarch64"))]
             #[inline]
             pub fn or(self) -> $elem_ty {
-                super::codegen::or::ReduceOr::reduce_or(self)
+                use ::coresimd::simd_llvm::simd_reduce_or;
+                unsafe {
+                    simd_reduce_or(self)
+                }
             }
+            /// Lane-wise bitwise `or` of the vector elements.
+            #[cfg(target_arch = "aarch64")]
+            #[inline]
+            pub fn or(self) -> $elem_ty {
+                // FIXME: `simd_reduce_or` is broken on AArch64
+                let mut x = self.extract(0) as $elem_ty;
+                for i in 1..$id::lanes() {
+                    x |= self.extract(i) as $elem_ty;
+                }
+                x
+            }
+
             /// Lane-wise bitwise `xor` of the vector elements.
+            #[cfg(not(target_arch = "aarch64"))]
             #[inline]
             pub fn xor(self) -> $elem_ty {
-                super::codegen::xor::ReduceXor::reduce_xor(self)
+                use ::coresimd::simd_llvm::simd_reduce_xor;
+                unsafe {
+                    simd_reduce_xor(self)
+                }
+            }
+            /// Lane-wise bitwise `xor` of the vector elements.
+            #[cfg(target_arch = "aarch64")]
+            #[inline]
+            pub fn xor(self) -> $elem_ty {
+                // FIXME: `simd_reduce_xor` is broken on AArch64
+                let mut x = self.extract(0) as $elem_ty;
+                for i in 1..$id::lanes() {
+                    x ^= self.extract(i) as $elem_ty;
+                }
+                x
             }
         }
     }
 }
 
 macro_rules! impl_bool_bitwise_reductions {
-    ($id:ident, $elem_ty:ident) => {
+    ($id:ident, $elem_ty:ident, $internal_ty:ident) => {
         impl $id {
             /// Lane-wise bitwise `and` of the vector elements.
+            #[cfg(not(target_arch = "aarch64"))]
             #[inline]
             pub fn and(self) -> $elem_ty {
-                super::codegen::and::ReduceAnd::reduce_and(self) !=0
+                use ::coresimd::simd_llvm::simd_reduce_and;
+                unsafe {
+                    let r: $internal_ty = simd_reduce_and(self);
+                    r != 0
+                }
+            }
+            /// Lane-wise bitwise `and` of the vector elements.
+            #[cfg(target_arch = "aarch64")]
+            #[inline]
+            pub fn and(self) -> $elem_ty {
+                // FIXME: `simd_reduce_and` is broken on AArch64
+                let mut x = self.extract(0) as $elem_ty;
+                for i in 1..$id::lanes() {
+                    x &= self.extract(i) as $elem_ty;
+                }
+                x
+            }
+
+            /// Lane-wise bitwise `or` of the vector elements.
+            #[cfg(not(target_arch = "aarch64"))]
+            #[inline]
+            pub fn or(self) -> $elem_ty {
+                use ::coresimd::simd_llvm::simd_reduce_or;
+                unsafe {
+                    let r: $internal_ty = simd_reduce_or(self);
+                    r != 0
+                }
             }
             /// Lane-wise bitwise `or` of the vector elements.
+            #[cfg(target_arch = "aarch64")]
             #[inline]
             pub fn or(self) -> $elem_ty {
-                super::codegen::or::ReduceOr::reduce_or(self) != 0
+                // FIXME: `simd_reduce_or` is broken on AArch64
+                let mut x = self.extract(0) as $elem_ty;
+                for i in 1..$id::lanes() {
+                    x |= self.extract(i) as $elem_ty;
+                }
+                x
+            }
+
+            /// Lane-wise bitwise `xor` of the vector elements.
+            #[cfg(not(target_arch = "aarch64"))]
+            #[inline]
+            pub fn xor(self) -> $elem_ty {
+                use ::coresimd::simd_llvm::simd_reduce_xor;
+                unsafe {
+                    let r: $internal_ty = simd_reduce_xor(self);
+                    r != 0
+                }
             }
             /// Lane-wise bitwise `xor` of the vector elements.
+            #[cfg(target_arch = "aarch64")]
             #[inline]
             pub fn xor(self) -> $elem_ty {
-                super::codegen::xor::ReduceXor::reduce_xor(self) != 0
+                // FIXME: `simd_reduce_xor` is broken on AArch64
+                let mut x = self.extract(0) as $elem_ty;
+                for i in 1..$id::lanes() {
+                    x ^= self.extract(i) as $elem_ty;
+                }
+                x
             }
         }
     }
 
@@ -5,19 +5,43 @@ macro_rules! impl_bool_reductions {
     ($id:ident) => {
         impl $id {
             /// Are `all` vector lanes `true`?
+            #[cfg(not(target_arch = "aarch64"))]
             #[inline]
             pub fn all(self) -> bool {
+                use ::coresimd::simd_llvm::simd_reduce_all;
+                unsafe {
+                    simd_reduce_all(self)
+                }
+            }
+            /// Are `all` vector lanes `true`?
+            #[cfg(target_arch = "aarch64")]
+            #[inline]
+            pub fn all(self) -> bool {
+                // FIXME: `simd_reduce_all` is broken on AArch64; use `and()`
                 self.and()
             }
+
+            /// Is `any` vector lanes `true`?
+            #[cfg(not(target_arch = "aarch64"))]
+            #[inline]
+            pub fn any(self) -> bool {
+                use ::coresimd::simd_llvm::simd_reduce_any;
+                unsafe {
+                    simd_reduce_any(self)
+                }
+            }
             /// Is `any` vector lanes `true`?
+            #[cfg(target_arch = "aarch64")]
             #[inline]
             pub fn any(self) -> bool {
+                // FIXME: `simd_reduce_any` is broken on AArch64; use `or()`
                 self.or()
             }
+
             /// Are `all` vector lanes `false`?
             #[inline]
             pub fn none(self) -> bool {
-                !self.or()
+                !self.any()
             }
         }
     }
 
@@ -5,14 +5,59 @@ macro_rules! impl_minmax_reductions {
     ($id:ident, $elem_ty:ident) => {
         impl $id {
             /// Largest vector value.
+            ///
+            /// FIXME: document behavior for float vectors with NaNs.
+            #[cfg(not(target_arch = "aarch64"))]
             #[inline]
             pub fn max(self) -> $elem_ty {
-                super::codegen::max::ReduceMax::reduce_max(self)
+                use ::coresimd::simd_llvm::simd_reduce_max;
+                unsafe {
+                    simd_reduce_max(self)
+                }
+            }
+            /// Largest vector value.
+            ///
+            /// FIXME: document behavior for float vectors with NaNs.
+            #[cfg(target_arch = "aarch64")]
+            #[allow(unused_imports)]
+            #[inline]
+            pub fn max(self) -> $elem_ty {
+                // FIXME: `simd_reduce_max` is broken on AArch64
+                use ::num::Float;
+                use ::cmp::Ord;
+                let mut x = self.extract(0);
+                for i in 1..$id::lanes() {
+                    x = x.max(self.extract(i));
+                }
+                x
+            }
+
+            /// Smallest vector value.
+            ///
+            /// FIXME: document behavior for float vectors with NaNs.
+            #[cfg(not(target_arch = "aarch64"))]
+            #[inline]
+            pub fn min(self) -> $elem_ty {
+                use ::coresimd::simd_llvm::simd_reduce_min;
+                unsafe {
+                    simd_reduce_min(self)
+                }
             }
             /// Smallest vector value.
+            ///
+            /// FIXME: document behavior for float vectors with NaNs.
+            #[cfg(target_arch = "aarch64")]
+            #[allow(unused_imports)]
             #[inline]
             pub fn min(self) -> $elem_ty {
-                super::codegen::min::ReduceMin::reduce_min(self)
+                // FIXME: `simd_reduce_min` is broken on AArch64
+                use ::num::Float;
+                use ::cmp::Ord;
+                let mut x = self.extract(0);
+                for i in 1..$id::lanes() {
+                    x = x.min(self.extract(i));
+                }
+                x
             }
         }
     }
 
@@ -244,7 +244,7 @@ macro_rules! simd_b_ty {
             [define_ty, $id, $($elem_tys),+ | $(#[$doc])*],
             [impl_bool_minimal, $id, $elem_ty, $elem_count, $($elem_name),*],
             [impl_bitwise_ops, $id, true],
-            [impl_bool_bitwise_reductions, $id, bool],
+            [impl_bool_bitwise_reductions, $id, bool, $elem_ty],
             [impl_bool_reductions, $id],
             [impl_bool_cmp, $id, $id],
             [impl_eq, $id],