Introduce SimdCvt trait family

Ralith · Ralith · commit d26ca59b3489 · 2025-07-10T17:42:32.000-07:00
diff --git a/fearless_simd/src/generated/simd_trait.rs b/fearless_simd/src/generated/simd_trait.rs
@@ -1,20 +1,22 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Level, SimdElement, SimdInto, seal::Seal};
+use crate::{Level, SimdCvtFloat, SimdCvtTruncate, SimdElement, SimdInto, seal::Seal};
 use crate::{
     f32x4, f32x8, f32x16, i8x16, i8x32, i8x64, i16x8, i16x16, i16x32, i32x4, i32x8, i32x16,
     mask8x16, mask8x32, mask8x64, mask16x8, mask16x16, mask16x32, mask32x4, mask32x8, mask32x16,
     u8x16, u8x32, u8x64, u16x8, u16x16, u16x32, u32x4, u32x8, u32x16,
 };
 #[doc = r" TODO: docstring"]
 pub trait Simd: Sized + Clone + Copy + Send + Sync + Seal + 'static {
-    type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>;
+    type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>
+        + SimdCvtFloat<Self::u32s>
+        + SimdCvtFloat<Self::i32s>;
     type u8s: SimdInt<u8, Self, Block = u8x16<Self>>;
     type i8s: SimdInt<i8, Self, Block = i8x16<Self>>;
     type u16s: SimdInt<u16, Self, Block = u16x8<Self>>;
     type i16s: SimdInt<i16, Self, Block = i16x8<Self>>;
-    type u32s: SimdInt<u32, Self, Block = u32x4<Self>>;
-    type i32s: SimdInt<i32, Self, Block = i32x4<Self>>;
+    type u32s: SimdInt<u32, Self, Block = u32x4<Self>> + SimdCvtTruncate<Self::f32s>;
+    type i32s: SimdInt<i32, Self, Block = i32x4<Self>> + SimdCvtTruncate<Self::f32s>;
     type mask8s: SimdMask<i8, Self, Block = mask8x16<Self>>;
     type mask16s: SimdMask<i16, Self, Block = mask16x8<Self>>;
     type mask32s: SimdMask<i32, Self, Block = mask32x4<Self>>;
@@ -667,6 +669,10 @@ pub trait SimdFloat<Element: SimdElement, S: Simd>:
     + core::ops::Div<Output = Self>
     + core::ops::Div<Element, Output = Self>
 {
+    #[inline(always)]
+    fn to_int<T: SimdCvtTruncate<Self>>(self) -> T {
+        T::truncate_from(self)
+    }
     fn abs(self) -> Self;
     fn sqrt(self) -> Self;
     fn copysign(self, rhs: impl SimdInto<Self, S>) -> Self;
@@ -702,6 +708,10 @@ pub trait SimdInt<Element: SimdElement, S: Simd>:
     + core::ops::BitXor<Output = Self>
     + core::ops::BitXor<Element, Output = Self>
 {
+    #[inline(always)]
+    fn to_float<T: SimdCvtFloat<Self>>(self) -> T {
+        T::float_from(self)
+    }
     fn simd_eq(self, rhs: impl SimdInto<Self, S>) -> Self::Mask;
     fn simd_lt(self, rhs: impl SimdInto<Self, S>) -> Self::Mask;
     fn simd_le(self, rhs: impl SimdInto<Self, S>) -> Self::Mask;
diff --git a/fearless_simd/src/generated/simd_types.rs b/fearless_simd/src/generated/simd_types.rs
@@ -1,6 +1,6 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Bytes, Select, Simd, SimdFrom, SimdInto};
+use crate::{Bytes, Select, Simd, SimdCvtFloat, SimdCvtTruncate, SimdFrom, SimdInto};
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(16))]
 pub struct f32x4<S: Simd> {
@@ -269,6 +269,16 @@ impl<S: Simd> crate::SimdFloat<f32, S> for f32x4<S> {
         self.simd.trunc_f32x4(self)
     }
 }
+impl<S: Simd> SimdCvtFloat<u32x4<S>> for f32x4<S> {
+    fn float_from(x: u32x4<S>) -> Self {
+        x.simd.cvt_f32_u32x4(x)
+    }
+}
+impl<S: Simd> SimdCvtFloat<i32x4<S>> for f32x4<S> {
+    fn float_from(x: i32x4<S>) -> Self {
+        x.simd.cvt_f32_i32x4(x)
+    }
+}
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(16))]
 pub struct i8x16<S: Simd> {
@@ -1597,6 +1607,11 @@ impl<S: Simd> crate::SimdInt<i32, S> for i32x4<S> {
         self.simd.max_i32x4(self, rhs.simd_into(self.simd))
     }
 }
+impl<S: Simd> SimdCvtTruncate<f32x4<S>> for i32x4<S> {
+    fn truncate_from(x: f32x4<S>) -> Self {
+        x.simd.cvt_i32_f32x4(x)
+    }
+}
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(16))]
 pub struct u32x4<S: Simd> {
@@ -1803,6 +1818,11 @@ impl<S: Simd> crate::SimdInt<u32, S> for u32x4<S> {
         self.simd.max_u32x4(self, rhs.simd_into(self.simd))
     }
 }
+impl<S: Simd> SimdCvtTruncate<f32x4<S>> for u32x4<S> {
+    fn truncate_from(x: f32x4<S>) -> Self {
+        x.simd.cvt_u32_f32x4(x)
+    }
+}
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(16))]
 pub struct mask32x4<S: Simd> {
@@ -2200,6 +2220,16 @@ impl<S: Simd> crate::SimdFloat<f32, S> for f32x8<S> {
         self.simd.trunc_f32x8(self)
     }
 }
+impl<S: Simd> SimdCvtFloat<u32x8<S>> for f32x8<S> {
+    fn float_from(x: u32x8<S>) -> Self {
+        x.simd.cvt_f32_u32x8(x)
+    }
+}
+impl<S: Simd> SimdCvtFloat<i32x8<S>> for f32x8<S> {
+    fn float_from(x: i32x8<S>) -> Self {
+        x.simd.cvt_f32_i32x8(x)
+    }
+}
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(32))]
 pub struct i8x32<S: Simd> {
@@ -3609,6 +3639,11 @@ impl<S: Simd> crate::SimdInt<i32, S> for i32x8<S> {
         self.simd.max_i32x8(self, rhs.simd_into(self.simd))
     }
 }
+impl<S: Simd> SimdCvtTruncate<f32x8<S>> for i32x8<S> {
+    fn truncate_from(x: f32x8<S>) -> Self {
+        x.simd.cvt_i32_f32x8(x)
+    }
+}
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(32))]
 pub struct u32x8<S: Simd> {
@@ -3824,6 +3859,11 @@ impl<S: Simd> crate::SimdInt<u32, S> for u32x8<S> {
         self.simd.max_u32x8(self, rhs.simd_into(self.simd))
     }
 }
+impl<S: Simd> SimdCvtTruncate<f32x8<S>> for u32x8<S> {
+    fn truncate_from(x: f32x8<S>) -> Self {
+        x.simd.cvt_u32_f32x8(x)
+    }
+}
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(32))]
 pub struct mask32x8<S: Simd> {
@@ -4235,6 +4275,16 @@ impl<S: Simd> crate::SimdFloat<f32, S> for f32x16<S> {
         self.simd.trunc_f32x16(self)
     }
 }
+impl<S: Simd> SimdCvtFloat<u32x16<S>> for f32x16<S> {
+    fn float_from(x: u32x16<S>) -> Self {
+        x.simd.cvt_f32_u32x16(x)
+    }
+}
+impl<S: Simd> SimdCvtFloat<i32x16<S>> for f32x16<S> {
+    fn float_from(x: i32x16<S>) -> Self {
+        x.simd.cvt_f32_i32x16(x)
+    }
+}
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(64))]
 pub struct i8x64<S: Simd> {
@@ -5775,6 +5825,11 @@ impl<S: Simd> crate::SimdInt<i32, S> for i32x16<S> {
         self.simd.max_i32x16(self, rhs.simd_into(self.simd))
     }
 }
+impl<S: Simd> SimdCvtTruncate<f32x16<S>> for i32x16<S> {
+    fn truncate_from(x: f32x16<S>) -> Self {
+        x.simd.cvt_i32_f32x16(x)
+    }
+}
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(64))]
 pub struct u32x16<S: Simd> {
@@ -5995,6 +6050,11 @@ impl<S: Simd> crate::SimdInt<u32, S> for u32x16<S> {
         self.simd.max_u32x16(self, rhs.simd_into(self.simd))
     }
 }
+impl<S: Simd> SimdCvtTruncate<f32x16<S>> for u32x16<S> {
+    fn truncate_from(x: f32x16<S>) -> Self {
+        x.simd.cvt_u32_f32x16(x)
+    }
+}
 #[derive(Clone, Copy, Debug)]
 #[repr(C, align(64))]
 pub struct mask32x16<S: Simd> {
diff --git a/fearless_simd/src/traits.rs b/fearless_simd/src/traits.rs
@@ -105,3 +105,13 @@ impl SimdElement for u32 {
 impl SimdElement for i32 {
     type Mask = i32;
 }
+
+/// Construction of integer vectors from floats by truncation
+pub trait SimdCvtTruncate<T> {
+    fn truncate_from(x: T) -> Self;
+}
+
+/// Construction of floating point vectors from integers
+pub trait SimdCvtFloat<T> {
+    fn float_from(x: T) -> Self;
+}
diff --git a/fearless_simd_gen/src/mk_fallback.rs b/fearless_simd_gen/src/mk_fallback.rs
@@ -359,6 +359,7 @@ fn mk_simd_impl() -> TokenStream {
             methods.push(method);
         }
     }
+
     // Note: the `vectorize` implementation is pretty boilerplate and should probably
     // be factored out for DRY.
     quote! {
diff --git a/fearless_simd_gen/src/mk_neon.rs b/fearless_simd_gen/src/mk_neon.rs
@@ -364,6 +364,7 @@ fn mk_simd_impl(level: Level) -> TokenStream {
             methods.push(method);
         }
     }
+
     // Note: the `vectorize` implementation is pretty boilerplate and should probably
     // be factored out for DRY.
     quote! {
diff --git a/fearless_simd_gen/src/mk_simd_trait.rs b/fearless_simd_gen/src/mk_simd_trait.rs
@@ -26,18 +26,18 @@ pub fn mk_simd_trait() -> TokenStream {
         }
     }
     let mut code = quote! {
-        use crate::{seal::Seal, Level, SimdElement, SimdInto};
+        use crate::{seal::Seal, Level, SimdElement, SimdInto, SimdCvtTruncate, SimdCvtFloat};
         #imports
         /// TODO: docstring
         // TODO: Seal
         pub trait Simd: Sized + Clone + Copy + Send + Sync + Seal + 'static {
-            type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>;
+            type f32s: SimdFloat<f32, Self, Block = f32x4<Self>> + SimdCvtFloat<Self::u32s> + SimdCvtFloat<Self::i32s>;
             type u8s: SimdInt<u8, Self, Block = u8x16<Self>>;
             type i8s: SimdInt<i8, Self, Block = i8x16<Self>>;
             type u16s: SimdInt<u16, Self, Block = u16x8<Self>>;
             type i16s: SimdInt<i16, Self, Block = i16x8<Self>>;
-            type u32s: SimdInt<u32, Self, Block = u32x4<Self>>;
-            type i32s: SimdInt<i32, Self, Block = i32x4<Self>>;
+            type u32s: SimdInt<u32, Self, Block = u32x4<Self>> + SimdCvtTruncate<Self::f32s>;
+            type i32s: SimdInt<i32, Self, Block = i32x4<Self>> + SimdCvtTruncate<Self::f32s>;
             type mask8s: SimdMask<i8, Self, Block = mask8x16<Self>>;
             type mask16s: SimdMask<i16, Self, Block = mask16x8<Self>>;
             type mask32s: SimdMask<i32, Self, Block = mask32x4<Self>>;
@@ -101,6 +101,9 @@ fn mk_simd_float() -> TokenStream {
             + core::ops::Div<Output = Self>
             + core::ops::Div<Element, Output = Self>
         {
+            #[inline(always)]
+            fn to_int<T: SimdCvtTruncate<Self>>(self) -> T { T::truncate_from(self) }
+
             #( #methods )*
         }
     }
@@ -123,6 +126,9 @@ fn mk_simd_int() -> TokenStream {
             + core::ops::BitXor<Output = Self>
             + core::ops::BitXor<Element, Output = Self>
         {
+            #[inline(always)]
+            fn to_float<T: SimdCvtFloat<Self>>(self) -> T { T::float_from(self) }
+
             #( #methods )*
         }
     }
diff --git a/fearless_simd_gen/src/mk_simd_types.rs b/fearless_simd_gen/src/mk_simd_types.rs
@@ -2,7 +2,7 @@
 // SPDX-License-Identifier: Apache-2.0 OR MIT
 
 use proc_macro2::{Ident, Literal, Span, TokenStream};
-use quote::quote;
+use quote::{format_ident, quote};
 
 use crate::{
     ops::{CORE_OPS, OpSig, TyFlavor, ops_for_type},
@@ -11,7 +11,7 @@ use crate::{
 
 pub fn mk_simd_types() -> TokenStream {
     let mut result = quote! {
-        use crate::{Bytes, Select, Simd, SimdFrom, SimdInto};
+        use crate::{Bytes, Select, Simd, SimdFrom, SimdInto, SimdCvtFloat, SimdCvtTruncate};
     };
     for ty in SIMD_TYPES {
         let name = ty.rust();
@@ -42,6 +42,50 @@ pub fn mk_simd_types() -> TokenStream {
                 .map(|idx| quote! { val[#idx] })
                 .collect::<Vec<_>>(),
         );
+        let mut cvt_impls = Vec::new();
+        match ty.scalar {
+            ScalarType::Float => {
+                for src_scalar in [ScalarType::Unsigned, ScalarType::Int] {
+                    let src_ty = VecType {
+                        scalar: src_scalar,
+                        ..*ty
+                    };
+                    let method = format_ident!(
+                        "cvt_{}_{}",
+                        ty.scalar.rust_name(ty.scalar_bits),
+                        src_ty.rust_name()
+                    );
+                    let src_ty = src_ty.rust();
+                    cvt_impls.push(quote! {
+                        impl<S: Simd> SimdCvtFloat<#src_ty<S>> for #name<S> {
+                            fn float_from(x: #src_ty<S>) -> Self {
+                                x.simd.#method(x)
+                            }
+                        }
+                    });
+                }
+            }
+            ScalarType::Int | ScalarType::Unsigned if ty.scalar_bits == 32 => {
+                let src_ty = VecType {
+                    scalar: ScalarType::Float,
+                    ..*ty
+                };
+                let method = format_ident!(
+                    "cvt_{}_{}",
+                    ty.scalar.rust_name(ty.scalar_bits),
+                    src_ty.rust_name()
+                );
+                let src_ty = src_ty.rust();
+                cvt_impls.push(quote! {
+                    impl<S: Simd> SimdCvtTruncate<#src_ty<S>> for #name<S> {
+                        fn truncate_from(x: #src_ty<S>) -> Self {
+                            x.simd.#method(x)
+                        }
+                    }
+                });
+            }
+            _ => {}
+        }
         result.extend(quote! {
             #[derive(Clone, Copy, Debug)]
             #[repr(C, align(#align_lit))]
@@ -119,6 +163,8 @@ pub fn mk_simd_types() -> TokenStream {
             }
 
             #impl_block
+
+            #( #cvt_impls )*
         });
     }
     result
diff --git a/fearless_simd_gen/src/types.rs b/fearless_simd_gen/src/types.rs
@@ -28,9 +28,12 @@ impl ScalarType {
         }
     }
 
+    pub fn rust_name(&self, scalar_bits: usize) -> String {
+        format!("{}{}", self.prefix(), scalar_bits)
+    }
+
     pub fn rust(&self, scalar_bits: usize) -> TokenStream {
-        let name = format!("{}{}", self.prefix(), scalar_bits);
-        let ident = Ident::new(&name, Span::call_site());
+        let ident = Ident::new(&self.rust_name(scalar_bits), Span::call_site());
         quote! { #ident }
     }
 }
diff --git a/fearless_simd_tests/tests/mod.rs b/fearless_simd_tests/tests/mod.rs
@@ -1,8 +1,16 @@
 // Copyright 2025 the Fearless_SIMD Authors
 // SPDX-License-Identifier: Apache-2.0 OR MIT
 
+use fearless_simd::{Simd, SimdFloat};
+
 #[cfg(target_arch = "wasm32")]
 wasm_bindgen_test::wasm_bindgen_test_configure!(run_in_browser);
 
 #[cfg(all(target_arch = "wasm32", target_feature = "simd128"))]
 mod wasm;
+
+// Ensure that we can cast between generic native-width vectors
+#[allow(dead_code)]
+fn generic_cast<S: Simd>(x: S::f32s) -> S::u32s {
+    x.to_int()
+}

Original file line number	Diff line number	Diff line change
`@@ -359,6 +359,7 @@ fn mk_simd_impl() -> TokenStream {`
`359`	`359`	`methods.push(method);`
`360`	`360`	`}`
`361`	`361`	`}`
	`362`	`+`
`362`	`363`	``// Note: the `vectorize` implementation is pretty boilerplate and should probably``
`363`	`364`	`// be factored out for DRY.`
`364`	`365`	`quote! {`
Original file line number	Diff line number	Diff line change
`@@ -364,6 +364,7 @@ fn mk_simd_impl(level: Level) -> TokenStream {`
`364`	`364`	`methods.push(method);`
`365`	`365`	`}`
`366`	`366`	`}`
	`367`	`+`
`367`	`368`	``// Note: the `vectorize` implementation is pretty boilerplate and should probably``
`368`	`369`	`// be factored out for DRY.`
`369`	`370`	`quote! {`
Original file line number	Diff line number	Diff line change
`@@ -26,18 +26,18 @@ pub fn mk_simd_trait() -> TokenStream {`
`26`	`26`	`}`
`27`	`27`	`}`
`28`	`28`	`let mut code = quote! {`
`29`		`- use crate::{seal::Seal, Level, SimdElement, SimdInto};`
	`29`	`+ use crate::{seal::Seal, Level, SimdElement, SimdInto, SimdCvtTruncate, SimdCvtFloat};`
`30`	`30`	`#imports`
`31`	`31`	`/// TODO: docstring`
`32`	`32`	`// TODO: Seal`
`33`	`33`	`pub trait Simd: Sized + Clone + Copy + Send + Sync + Seal + 'static {`
`34`		`- type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>;`
	`34`	`+ type f32s: SimdFloat<f32, Self, Block = f32x4<Self>> + SimdCvtFloat<Self::u32s> + SimdCvtFloat<Self::i32s>;`
`35`	`35`	`type u8s: SimdInt<u8, Self, Block = u8x16<Self>>;`
`36`	`36`	`type i8s: SimdInt<i8, Self, Block = i8x16<Self>>;`
`37`	`37`	`type u16s: SimdInt<u16, Self, Block = u16x8<Self>>;`
`38`	`38`	`type i16s: SimdInt<i16, Self, Block = i16x8<Self>>;`
`39`		`- type u32s: SimdInt<u32, Self, Block = u32x4<Self>>;`
`40`		`- type i32s: SimdInt<i32, Self, Block = i32x4<Self>>;`
	`39`	`+ type u32s: SimdInt<u32, Self, Block = u32x4<Self>> + SimdCvtTruncate<Self::f32s>;`
	`40`	`+ type i32s: SimdInt<i32, Self, Block = i32x4<Self>> + SimdCvtTruncate<Self::f32s>;`
`41`	`41`	`type mask8s: SimdMask<i8, Self, Block = mask8x16<Self>>;`
`42`	`42`	`type mask16s: SimdMask<i16, Self, Block = mask16x8<Self>>;`
`43`	`43`	`type mask32s: SimdMask<i32, Self, Block = mask32x4<Self>>;`
`@@ -101,6 +101,9 @@ fn mk_simd_float() -> TokenStream {`
`101`	`101`	`+ core::ops::Div<Output = Self>`
`102`	`102`	`+ core::ops::Div<Element, Output = Self>`
`103`	`103`	`{`
	`104`	`+ #[inline(always)]`
	`105`	`+ fn to_int<T: SimdCvtTruncate<Self>>(self) -> T { T::truncate_from(self) }`
	`106`	`+`
`104`	`107`	`#( #methods )*`
`105`	`108`	`}`
`106`	`109`	`}`
`@@ -123,6 +126,9 @@ fn mk_simd_int() -> TokenStream {`
`123`	`126`	`+ core::ops::BitXor<Output = Self>`
`124`	`127`	`+ core::ops::BitXor<Element, Output = Self>`
`125`	`128`	`{`
	`129`	`+ #[inline(always)]`
	`130`	`+ fn to_float<T: SimdCvtFloat<Self>>(self) -> T { T::float_from(self) }`
	`131`	`+`
`126`	`132`	`#( #methods )*`
`127`	`133`	`}`
`128`	`134`	`}`
Original file line number	Diff line number	Diff line change
`@@ -28,9 +28,12 @@ impl ScalarType {`
`28`	`28`	`}`
`29`	`29`	`}`
`30`	`30`
	`31`	`+ pub fn rust_name(&self, scalar_bits: usize) -> String {`
	`32`	`+ format!("{}{}", self.prefix(), scalar_bits)`
	`33`	`+ }`
	`34`	`+`
`31`	`35`	`pub fn rust(&self, scalar_bits: usize) -> TokenStream {`
`32`		`- let name = format!("{}{}", self.prefix(), scalar_bits);`
`33`		`- let ident = Ident::new(&name, Span::call_site());`
	`36`	`+ let ident = Ident::new(&self.rust_name(scalar_bits), Span::call_site());`
`34`	`37`	`quote! { #ident }`
`35`	`38`	`}`
`36`	`39`	`}`