Commit b2763cc
Auto merge of #94899 - workingjubilee:bump-simd-clamp, r=workingjubilee

Bump portable-simd to shadow Ord

Yon usual bump. Summary for reference:

- We are moving away from the subjective "directional" nomenclature, so `horizontal_*` becomes `reduce_*`, et cetera.
- In addition, `Simd<Int, N>` now has methods which shadow Ord's methods directly, making those methods behave like the already "overloaded" float methods do.
2 parents 4800c78 + 2b1f249 commit b2763cc
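For orientation, here is a minimal sketch of the renamed reduction and the new Ord-shadowing methods. It assumes a nightly toolchain whose `std::simd` matches this revision of portable-simd; the values and the `main` function are illustrative only.

```rust
#![feature(portable_simd)]
use std::simd::Simd;

fn main() {
    let a = Simd::<i32, 4>::from_array([1, 2, 3, 4]);
    let b = Simd::<i32, 4>::from_array([4, 3, 2, 1]);

    // Formerly `horizontal_sum()`: merge the lanes of one vector into a scalar.
    let total = a.reduce_sum();
    assert_eq!(total, 10);

    // Integer vectors now shadow Ord's methods lane-wise, mirroring the
    // behavior the float vectors already had.
    assert_eq!(a.min(b).to_array(), [1, 2, 2, 1]);
    assert_eq!(a.max(b).to_array(), [4, 3, 3, 4]);
    assert_eq!(
        a.clamp(Simd::splat(2), Simd::splat(3)).to_array(),
        [2, 2, 3, 3]
    );
}
```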

20 files changed: +214 −105 lines changed

library/core/src/slice/mod.rs

Lines changed: 1 addition & 1 deletion
@@ -3536,7 +3536,7 @@ impl<T> [T] {
     ///         suffix.iter().copied().sum(),
     ///     ]);
     ///     let sums = middle.iter().copied().fold(sums, f32x4::add);
-    ///     sums.horizontal_sum()
+    ///     sums.reduce_sum()
     /// }
     ///
     /// let numbers: Vec<f32> = (1..101).map(|x| x as _).collect();

library/portable-simd/beginners-guide.md

Lines changed: 2 additions & 2 deletions
@@ -33,7 +33,7 @@ SIMD has a few special vocabulary terms you should know:
 
 * **Vertical:** When an operation is "vertical", each lane processes individually without regard to the other lanes in the same vector. For example, a "vertical add" between two vectors would add lane 0 in `a` with lane 0 in `b`, with the total in lane 0 of `out`, and then the same thing for lanes 1, 2, etc. Most SIMD operations are vertical operations, so if your problem is a vertical problem then you can probably solve it with SIMD.
 
-* **Horizontal:** When an operation is "horizontal", the lanes within a single vector interact in some way. A "horizontal add" might add up lane 0 of `a` with lane 1 of `a`, with the total in lane 0 of `out`.
+* **Reducing/Reduce:** When an operation is "reducing" (functions named `reduce_*`), the lanes within a single vector are merged using some operation such as addition, returning the merged value as a scalar. For instance, a reducing add would return the sum of all the lanes' values.
 
 * **Target Feature:** Rust calls a CPU architecture extension a `target_feature`. Proper SIMD requires various CPU extensions to be enabled (details below). Don't confuse this with `feature`, which is a Cargo crate concept.
 
@@ -83,4 +83,4 @@ Fortunately, most SIMD types have a fairly predictable size. `i32x4` is bit-equi
 However, this is not the same as alignment. Computer architectures generally prefer aligned accesses, especially when moving data between memory and vector registers, and while some support specialized operations that can bend the rules to help with this, unaligned access is still typically slow, or even undefined behavior. In addition, different architectures can require different alignments when interacting with their native SIMD types. For this reason, any `#[repr(simd)]` type has a non-portable alignment. If it is necessary to directly interact with the alignment of these types, it should be via [`mem::align_of`].
 
 [`mem::transmute`]: https://doc.rust-lang.org/core/mem/fn.transmute.html
-[`mem::align_of`]: https://doc.rust-lang.org/core/mem/fn.align_of.html
+[`mem::align_of`]: https://doc.rust-lang.org/core/mem/fn.align_of.html
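To make the vertical/reducing distinction concrete, a small sketch (assuming nightly Rust with `#![feature(portable_simd)]` and this revision of the crate):

```rust
#![feature(portable_simd)]
use std::simd::f32x4;

fn main() {
    let a = f32x4::from_array([1.0, 2.0, 3.0, 4.0]);
    let b = f32x4::from_array([10.0, 20.0, 30.0, 40.0]);

    // Vertical: lane i of `a` is combined with lane i of `b`.
    let vertical = a + b;
    assert_eq!(vertical.to_array(), [11.0, 22.0, 33.0, 44.0]);

    // Reducing: the lanes of a single vector are merged into one scalar.
    let reduced = a.reduce_sum();
    assert_eq!(reduced, 10.0);
}
```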

library/portable-simd/crates/core_simd/Cargo.toml

Lines changed: 1 addition & 1 deletion
@@ -9,7 +9,7 @@ categories = ["hardware-support", "no-std"]
 license = "MIT OR Apache-2.0"
 
 [features]
-default = ["std", "generic_const_exprs"]
+default = []
 std = []
 generic_const_exprs = []
 

library/portable-simd/crates/core_simd/examples/matrix_inversion.rs

Lines changed: 1 addition & 1 deletion
@@ -233,7 +233,7 @@ pub fn simd_inv4x4(m: Matrix4x4) -> Option<Matrix4x4> {
     let det = det.rotate_lanes_right::<2>() + det;
     let det = det.reverse().rotate_lanes_right::<2>() + det;
 
-    if det.horizontal_sum() == 0. {
+    if det.reduce_sum() == 0. {
         return None;
     }
     // calculate the reciprocal

library/portable-simd/crates/core_simd/examples/nbody.rs

Lines changed: 4 additions & 4 deletions
@@ -107,10 +107,10 @@ mod nbody {
         let mut e = 0.;
         for i in 0..N_BODIES {
             let bi = &bodies[i];
-            e += bi.mass * (bi.v * bi.v).horizontal_sum() * 0.5;
+            e += bi.mass * (bi.v * bi.v).reduce_sum() * 0.5;
             for bj in bodies.iter().take(N_BODIES).skip(i + 1) {
                 let dx = bi.x - bj.x;
-                e -= bi.mass * bj.mass / (dx * dx).horizontal_sum().sqrt()
+                e -= bi.mass * bj.mass / (dx * dx).reduce_sum().sqrt()
             }
         }
         e
@@ -134,8 +134,8 @@ mod nbody {
         let mut mag = [0.0; N];
         for i in (0..N).step_by(2) {
             let d2s = f64x2::from_array([
-                (r[i] * r[i]).horizontal_sum(),
-                (r[i + 1] * r[i + 1]).horizontal_sum(),
+                (r[i] * r[i]).reduce_sum(),
+                (r[i + 1] * r[i + 1]).reduce_sum(),
             ]);
             let dmags = f64x2::splat(dt) / (d2s * d2s.sqrt());
             mag[i] = dmags[0];

library/portable-simd/crates/core_simd/examples/spectral_norm.rs

Lines changed: 2 additions & 2 deletions
@@ -20,7 +20,7 @@ fn mult_av(v: &[f64], out: &mut [f64]) {
             sum += b / a;
             j += 2
         }
-        *out = sum.horizontal_sum();
+        *out = sum.reduce_sum();
     }
 }
 
@@ -38,7 +38,7 @@ fn mult_atv(v: &[f64], out: &mut [f64]) {
             sum += b / a;
             j += 2
         }
-        *out = sum.horizontal_sum();
+        *out = sum.reduce_sum();
     }
 }
 

library/portable-simd/crates/core_simd/src/comparisons.rs

Lines changed: 52 additions & 0 deletions
@@ -66,3 +66,55 @@ where
         unsafe { Mask::from_int_unchecked(intrinsics::simd_ge(self, other)) }
     }
 }
+
+macro_rules! impl_ord_methods_vector {
+    { $type:ty } => {
+        impl<const LANES: usize> Simd<$type, LANES>
+        where
+            LaneCount<LANES>: SupportedLaneCount,
+        {
+            /// Returns the lane-wise minimum with `other`.
+            #[must_use = "method returns a new vector and does not mutate the original value"]
+            #[inline]
+            pub fn min(self, other: Self) -> Self {
+                self.lanes_gt(other).select(other, self)
+            }
+
+            /// Returns the lane-wise maximum with `other`.
+            #[must_use = "method returns a new vector and does not mutate the original value"]
+            #[inline]
+            pub fn max(self, other: Self) -> Self {
+                self.lanes_lt(other).select(other, self)
+            }
+
+            /// Restrict each lane to a certain interval.
+            ///
+            /// For each lane, returns `max` if `self` is greater than `max`, and `min` if `self` is
+            /// less than `min`. Otherwise returns `self`.
+            ///
+            /// # Panics
+            ///
+            /// Panics if `min > max` on any lane.
+            #[must_use = "method returns a new vector and does not mutate the original value"]
+            #[inline]
+            pub fn clamp(self, min: Self, max: Self) -> Self {
+                assert!(
+                    min.lanes_le(max).all(),
+                    "each lane in `min` must be less than or equal to the corresponding lane in `max`",
+                );
+                self.max(min).min(max)
+            }
+        }
+    }
+}
+
+impl_ord_methods_vector!(i8);
+impl_ord_methods_vector!(i16);
+impl_ord_methods_vector!(i32);
+impl_ord_methods_vector!(i64);
+impl_ord_methods_vector!(isize);
+impl_ord_methods_vector!(u8);
+impl_ord_methods_vector!(u16);
+impl_ord_methods_vector!(u32);
+impl_ord_methods_vector!(u64);
+impl_ord_methods_vector!(usize);
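A brief usage sketch of the new integer `min`/`max`/`clamp` methods (hypothetical call site, assuming the nightly `portable_simd` feature):

```rust
#![feature(portable_simd)]
use std::simd::Simd;

fn main() {
    let x = Simd::<i32, 4>::from_array([-5, 0, 7, 100]);

    // Each lane is clamped into [0, 10] independently.
    let clamped = x.clamp(Simd::splat(0), Simd::splat(10));
    assert_eq!(clamped.to_array(), [0, 0, 7, 10]);

    // Per the docs above, this would panic: a lane of `min` (10)
    // exceeds the corresponding lane of `max` (0).
    // let _ = x.clamp(Simd::splat(10), Simd::splat(0));
}
```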

library/portable-simd/crates/core_simd/src/intrinsics.rs

Lines changed: 8 additions & 1 deletion
@@ -18,7 +18,6 @@
 //!
 //! Unless stated otherwise, all intrinsics for binary operations require SIMD vectors of equal types and lengths.
 
-
 // These intrinsics aren't linked directly from LLVM and are mostly undocumented, however they are
 // mostly lowered to the matching LLVM instructions by the compiler in a fairly straightforward manner.
 // The associated LLVM instruction or intrinsic is documented alongside each Rust intrinsic function.
@@ -130,6 +129,14 @@ extern "platform-intrinsic" {
     pub(crate) fn simd_reduce_xor<T, U>(x: T) -> U;
 
     // truncate integer vector to bitmask
+    // `fn simd_bitmask(vector) -> unsigned integer` takes a vector of integers and
+    // returns either an unsigned integer or array of `u8`.
+    // Every element in the vector becomes a single bit in the returned bitmask.
+    // If the vector has less than 8 lanes, a u8 is returned with zeroed trailing bits.
+    // The bit order of the result depends on the byte endianness. LSB-first for little
+    // endian and MSB-first for big endian.
+    //
+    // UB if called on a vector with values other than 0 and -1.
     #[allow(unused)]
     pub(crate) fn simd_bitmask<T, U>(x: T) -> U;
 
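The new comment describes the bitmask layout; here is a scalar model of it (not the intrinsic itself, just an illustrative sketch of the little-endian, LSB-first case):

```rust
// Each lane becomes one bit, LSB-first; masks with fewer than 8 lanes
// leave the remaining high bits of the returned u8 zeroed.
fn bitmask_model(lanes: &[bool]) -> u8 {
    assert!(lanes.len() <= 8);
    lanes
        .iter()
        .enumerate()
        .fold(0u8, |acc, (i, &set)| acc | ((set as u8) << i))
}

fn main() {
    // A 4-lane mask [true, false, true, true] packs to 0b0000_1101.
    assert_eq!(bitmask_model(&[true, false, true, true]), 0b0000_1101);
}
```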

library/portable-simd/crates/core_simd/src/lib.rs

Lines changed: 1 addition & 2 deletions
@@ -1,6 +1,5 @@
-#![cfg_attr(not(feature = "std"), no_std)]
+#![no_std]
 #![feature(
-    const_fn_trait_bound,
     convert_float_to_int,
     decl_macro,
     intra_doc_pointers,

library/portable-simd/crates/core_simd/src/masks/to_bitmask.rs

Lines changed: 3 additions & 0 deletions
@@ -50,6 +50,9 @@ macro_rules! impl_integer_intrinsic {
 }
 
 impl_integer_intrinsic! {
+    unsafe impl ToBitMask<BitMask=u8> for Mask<_, 1>
+    unsafe impl ToBitMask<BitMask=u8> for Mask<_, 2>
+    unsafe impl ToBitMask<BitMask=u8> for Mask<_, 4>
     unsafe impl ToBitMask<BitMask=u8> for Mask<_, 8>
     unsafe impl ToBitMask<BitMask=u16> for Mask<_, 16>
     unsafe impl ToBitMask<BitMask=u32> for Mask<_, 32>
