Introduce SimdCvt trait family

Ralith · Ralith · commit 5b8350016237 · 2025-07-09T20:59:23.000-07:00
diff --git a/fearless_simd/src/generated/fallback.rs b/fearless_simd/src/generated/fallback.rs
@@ -1,6 +1,6 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Level, Simd, SimdInto, seal::Seal};
+use crate::{Level, Simd, SimdCvtFloat, SimdCvtTruncate, SimdInto, seal::Seal};
 use crate::{
     f32x4, f32x8, f32x16, i8x16, i8x32, i8x64, i16x8, i16x16, i16x32, i32x4, i32x8, i32x16,
     mask8x16, mask8x32, mask8x64, mask16x8, mask16x16, mask16x32, mask32x4, mask32x8, mask32x16,
@@ -4887,3 +4887,21 @@ impl Simd for Fallback {
         (b0.simd_into(self), b1.simd_into(self))
     }
 }
+impl SimdCvtTruncate<f32x4<Fallback>> for u32x4<Fallback> {
+    #[inline(always)]
+    fn truncate_from(x: f32x4<Fallback>) -> Self {
+        Self {
+            val: x.val.map(|e| e as u32),
+            simd: x.simd,
+        }
+    }
+}
+impl SimdCvtFloat<u32x4<Fallback>> for f32x4<Fallback> {
+    #[inline(always)]
+    fn float_from(x: u32x4<Fallback>) -> Self {
+        Self {
+            val: x.val.map(|e| e as f32),
+            simd: x.simd,
+        }
+    }
+}
diff --git a/fearless_simd/src/generated/neon.rs b/fearless_simd/src/generated/neon.rs
@@ -1,6 +1,6 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Level, Simd, SimdFrom, SimdInto, seal::Seal};
+use crate::{Level, Simd, SimdCvtFloat, SimdCvtTruncate, SimdFrom, SimdInto, seal::Seal};
 use crate::{
     f32x4, f32x8, f32x16, i8x16, i8x32, i8x64, i16x8, i16x16, i16x32, i32x4, i32x8, i32x16,
     mask8x16, mask8x32, mask8x64, mask16x8, mask16x16, mask16x32, mask32x4, mask32x8, mask32x16,
@@ -3166,6 +3166,18 @@ impl Simd for Neon {
         (b0.simd_into(self), b1.simd_into(self))
     }
 }
+impl SimdCvtTruncate<f32x4<Neon>> for u32x4<Neon> {
+    #[inline(always)]
+    fn truncate_from(x: f32x4<Neon>) -> Self {
+        unsafe { vcvtq_u32_f32(x.into()).simd_into(x.simd) }
+    }
+}
+impl SimdCvtFloat<u32x4<Neon>> for f32x4<Neon> {
+    #[inline(always)]
+    fn float_from(x: u32x4<Neon>) -> Self {
+        unsafe { vcvtq_f32_u32(x.into()).simd_into(x.simd) }
+    }
+}
 impl<S: Simd> SimdFrom<float32x4_t, S> for f32x4<S> {
     #[inline(always)]
     fn simd_from(arch: float32x4_t, simd: S) -> Self {
diff --git a/fearless_simd/src/generated/simd_trait.rs b/fearless_simd/src/generated/simd_trait.rs
@@ -1,19 +1,19 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Level, SimdElement, SimdInto, seal::Seal};
+use crate::{Level, SimdCvtFloat, SimdCvtTruncate, SimdElement, SimdInto, seal::Seal};
 use crate::{
     f32x4, f32x8, f32x16, i8x16, i8x32, i8x64, i16x8, i16x16, i16x32, i32x4, i32x8, i32x16,
     mask8x16, mask8x32, mask8x64, mask16x8, mask16x16, mask16x32, mask32x4, mask32x8, mask32x16,
     u8x16, u8x32, u8x64, u16x8, u16x16, u16x32, u32x4, u32x8, u32x16,
 };
 #[doc = r" TODO: docstring"]
 pub trait Simd: Sized + Clone + Copy + Send + Sync + Seal + 'static {
-    type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>;
+    type f32s: SimdFloat<f32, Self, Block = f32x4<Self>> + SimdCvtFloat<Self::u32s>;
     type u8s: SimdInt<u8, Self, Block = u8x16<Self>>;
     type i8s: SimdInt<i8, Self, Block = i8x16<Self>>;
     type u16s: SimdInt<u16, Self, Block = u16x8<Self>>;
     type i16s: SimdInt<i16, Self, Block = i16x8<Self>>;
-    type u32s: SimdInt<u32, Self, Block = u32x4<Self>>;
+    type u32s: SimdInt<u32, Self, Block = u32x4<Self>> + SimdCvtTruncate<Self::f32s>;
     type i32s: SimdInt<i32, Self, Block = i32x4<Self>>;
     type mask8s: SimdMask<i8, Self, Block = mask8x16<Self>>;
     type mask16s: SimdMask<i16, Self, Block = mask16x8<Self>>;
@@ -661,6 +661,10 @@ pub trait SimdFloat<Element: SimdElement, S: Simd>:
     + core::ops::Div<Output = Self>
     + core::ops::Div<Element, Output = Self>
 {
+    #[inline(always)]
+    fn cvt_trunc<T: SimdCvtTruncate<Self>>(self) -> T {
+        T::truncate_from(self)
+    }
     fn abs(self) -> Self;
     fn sqrt(self) -> Self;
     fn copysign(self, rhs: impl SimdInto<Self, S>) -> Self;
@@ -696,6 +700,10 @@ pub trait SimdInt<Element: SimdElement, S: Simd>:
     + core::ops::BitXor<Output = Self>
     + core::ops::BitXor<Element, Output = Self>
 {
+    #[inline(always)]
+    fn cvt_float<T: SimdCvtFloat<Self>>(self) -> T {
+        T::float_from(self)
+    }
     fn simd_eq(self, rhs: impl SimdInto<Self, S>) -> Self::Mask;
     fn simd_lt(self, rhs: impl SimdInto<Self, S>) -> Self::Mask;
     fn simd_le(self, rhs: impl SimdInto<Self, S>) -> Self::Mask;
diff --git a/fearless_simd/src/generated/wasm.rs b/fearless_simd/src/generated/wasm.rs
@@ -1,6 +1,6 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Level, Simd, SimdFrom, SimdInto, seal::Seal};
+use crate::{Level, Simd, SimdCvtFloat, SimdCvtTruncate, SimdFrom, SimdInto, seal::Seal};
 use crate::{
     f32x4, f32x8, f32x16, i8x16, i8x32, i8x64, i16x8, i16x16, i16x32, i32x4, i32x8, i32x16,
     mask8x16, mask8x32, mask8x64, mask16x8, mask16x16, mask16x32, mask32x4, mask32x8, mask32x16,
@@ -3305,6 +3305,18 @@ impl Simd for WasmSimd128 {
         (b0.simd_into(self), b1.simd_into(self))
     }
 }
+impl SimdCvtTruncate<f32x4<WasmSimd128>> for u32x4<WasmSimd128> {
+    #[inline(always)]
+    fn truncate_from(x: f32x4<WasmSimd128>) -> Self {
+        u32x4_trunc_sat_f32x4(x.into()).simd_into(x.simd)
+    }
+}
+impl SimdCvtFloat<u32x4<WasmSimd128>> for f32x4<WasmSimd128> {
+    #[inline(always)]
+    fn float_from(x: u32x4<WasmSimd128>) -> Self {
+        f32x4_convert_u32x4(x.into()).simd_into(x.simd)
+    }
+}
 impl<S: Simd> SimdFrom<v128, S> for f32x4<S> {
     #[inline(always)]
     fn simd_from(arch: v128, simd: S) -> Self {
diff --git a/fearless_simd/src/traits.rs b/fearless_simd/src/traits.rs
@@ -105,3 +105,13 @@ impl SimdElement for u32 {
 impl SimdElement for i32 {
     type Mask = i32;
 }
+
+/// Construction of integer vectors from floating-point vectors by lane-wise truncation
+pub trait SimdCvtTruncate<T> {
+    fn truncate_from(x: T) -> Self;
+}
+
+/// Construction of floating-point vectors from integer vectors by lane-wise conversion
+pub trait SimdCvtFloat<T> {
+    fn float_from(x: T) -> Self;
+}
diff --git a/fearless_simd_gen/src/mk_fallback.rs b/fearless_simd_gen/src/mk_fallback.rs
@@ -32,7 +32,7 @@ pub fn mk_fallback_impl() -> TokenStream {
 
     quote! {
         use core::ops::*;
-        use crate::{seal::Seal, Level, Simd, SimdInto};
+        use crate::{seal::Seal, Level, Simd, SimdInto, SimdCvtTruncate, SimdCvtFloat};
 
         #imports
 
@@ -385,6 +385,26 @@ fn mk_simd_impl() -> TokenStream {
 
             #( #methods )*
         }
+
+        impl SimdCvtTruncate<f32x4<#level_tok>> for u32x4<#level_tok> {
+            #[inline(always)]
+            fn truncate_from(x: f32x4<#level_tok>) -> Self {
+                Self {
+                    val: x.val.map(|e| e as u32),
+                    simd: x.simd,
+                }
+            }
+        }
+
+        impl SimdCvtFloat<u32x4<#level_tok>> for f32x4<#level_tok> {
+            #[inline(always)]
+            fn float_from(x: u32x4<#level_tok>) -> Self {
+                Self {
+                    val: x.val.map(|e| e as f32),
+                    simd: x.simd,
+                }
+            }
+        }
     }
 }
 
diff --git a/fearless_simd_gen/src/mk_neon.rs b/fearless_simd_gen/src/mk_neon.rs
@@ -44,7 +44,7 @@ pub fn mk_neon_impl(level: Level) -> TokenStream {
     quote! {
         use core::arch::aarch64::*;
 
-        use crate::{seal::Seal, Level, Simd, SimdFrom, SimdInto};
+        use crate::{seal::Seal, Level, Simd, SimdFrom, SimdInto, SimdCvtTruncate, SimdCvtFloat};
 
         #imports
 
@@ -396,6 +396,24 @@ fn mk_simd_impl(level: Level) -> TokenStream {
 
             #( #methods )*
         }
+
+        impl SimdCvtTruncate<f32x4<#level_tok>> for u32x4<#level_tok> {
+            #[inline(always)]
+            fn truncate_from(x: f32x4<#level_tok>) -> Self {
+                unsafe {
+                    vcvtq_u32_f32(x.into()).simd_into(x.simd)
+                }
+            }
+        }
+
+        impl SimdCvtFloat<u32x4<#level_tok>> for f32x4<#level_tok> {
+            #[inline(always)]
+            fn float_from(x: u32x4<#level_tok>) -> Self {
+                unsafe {
+                    vcvtq_f32_u32(x.into()).simd_into(x.simd)
+                }
+            }
+        }
     }
 }
 
diff --git a/fearless_simd_gen/src/mk_simd_trait.rs b/fearless_simd_gen/src/mk_simd_trait.rs
@@ -26,17 +26,17 @@ pub fn mk_simd_trait() -> TokenStream {
         }
     }
     let mut code = quote! {
-        use crate::{seal::Seal, Level, SimdElement, SimdInto};
+        use crate::{seal::Seal, Level, SimdElement, SimdInto, SimdCvtTruncate, SimdCvtFloat};
         #imports
         /// TODO: docstring
         // TODO: Seal
         pub trait Simd: Sized + Clone + Copy + Send + Sync + Seal + 'static {
-            type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>;
+            type f32s: SimdFloat<f32, Self, Block = f32x4<Self>> + SimdCvtFloat<Self::u32s>;
             type u8s: SimdInt<u8, Self, Block = u8x16<Self>>;
             type i8s: SimdInt<i8, Self, Block = i8x16<Self>>;
             type u16s: SimdInt<u16, Self, Block = u16x8<Self>>;
             type i16s: SimdInt<i16, Self, Block = i16x8<Self>>;
-            type u32s: SimdInt<u32, Self, Block = u32x4<Self>>;
+            type u32s: SimdInt<u32, Self, Block = u32x4<Self>> + SimdCvtTruncate<Self::f32s>;
             type i32s: SimdInt<i32, Self, Block = i32x4<Self>>;
             type mask8s: SimdMask<i8, Self, Block = mask8x16<Self>>;
             type mask16s: SimdMask<i16, Self, Block = mask16x8<Self>>;
@@ -101,6 +101,9 @@ fn mk_simd_float() -> TokenStream {
             + core::ops::Div<Output = Self>
             + core::ops::Div<Element, Output = Self>
         {
+            #[inline(always)]
+            fn cvt_trunc<T: SimdCvtTruncate<Self>>(self) -> T { T::truncate_from(self) }
+
             #( #methods )*
         }
     }
@@ -123,6 +126,9 @@ fn mk_simd_int() -> TokenStream {
             + core::ops::BitXor<Output = Self>
             + core::ops::BitXor<Element, Output = Self>
         {
+            #[inline(always)]
+            fn cvt_float<T: SimdCvtFloat<Self>>(self) -> T { T::float_from(self) }
+
             #( #methods )*
         }
     }
diff --git a/fearless_simd_gen/src/mk_wasm.rs b/fearless_simd_gen/src/mk_wasm.rs
@@ -500,6 +500,20 @@ fn mk_simd_impl(level: Level) -> TokenStream {
 
             #( #methods )*
         }
+
+        impl SimdCvtTruncate<f32x4<#level_tok>> for u32x4<#level_tok> {
+            #[inline(always)]
+            fn truncate_from(x: f32x4<#level_tok>) -> Self {
+                u32x4_trunc_sat_f32x4(x.into()).simd_into(x.simd)
+            }
+        }
+
+        impl SimdCvtFloat<u32x4<#level_tok>> for f32x4<#level_tok> {
+            #[inline(always)]
+            fn float_from(x: u32x4<#level_tok>) -> Self {
+                f32x4_convert_u32x4(x.into()).simd_into(x.simd)
+            }
+        }
     }
 }
 
@@ -512,7 +526,7 @@ pub fn mk_wasm128_impl(level: Level) -> TokenStream {
     quote! {
         use core::arch::wasm32::*;
 
-        use crate::{seal::Seal, Level, Simd, SimdFrom, SimdInto};
+        use crate::{seal::Seal, Level, Simd, SimdFrom, SimdInto, SimdCvtTruncate, SimdCvtFloat};
 
         #imports
 
diff --git a/fearless_simd_tests/tests/mod.rs b/fearless_simd_tests/tests/mod.rs
@@ -1,8 +1,16 @@
 // Copyright 2025 the Fearless_SIMD Authors
 // SPDX-License-Identifier: Apache-2.0 OR MIT
 
+use fearless_simd::{Simd, SimdFloat};
+
 #[cfg(target_arch = "wasm32")]
 wasm_bindgen_test::wasm_bindgen_test_configure!(run_in_browser);
 
 #[cfg(all(target_arch = "wasm32", target_feature = "simd128"))]
 mod wasm;
+
+// Ensure that we can cast between generic native-width vectors
+#[allow(dead_code)]
+fn generic_cast<S: Simd>(x: S::f32s) -> S::u32s {
+    x.cvt_trunc()
+}

Original file line number	Diff line number	Diff line change
`@@ -26,17 +26,17 @@ pub fn mk_simd_trait() -> TokenStream {`
`26`	`26`	`}`
`27`	`27`	`}`
`28`	`28`	`let mut code = quote! {`
`29`		`- use crate::{seal::Seal, Level, SimdElement, SimdInto};`
	`29`	`+ use crate::{seal::Seal, Level, SimdElement, SimdInto, SimdCvtTruncate, SimdCvtFloat};`
`30`	`30`	`#imports`
`31`	`31`	`/// TODO: docstring`
`32`	`32`	`// TODO: Seal`
`33`	`33`	`pub trait Simd: Sized + Clone + Copy + Send + Sync + Seal + 'static {`
`34`		`- type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>;`
	`34`	`+ type f32s: SimdFloat<f32, Self, Block = f32x4<Self>> + SimdCvtFloat<Self::u32s>;`
`35`	`35`	`type u8s: SimdInt<u8, Self, Block = u8x16<Self>>;`
`36`	`36`	`type i8s: SimdInt<i8, Self, Block = i8x16<Self>>;`
`37`	`37`	`type u16s: SimdInt<u16, Self, Block = u16x8<Self>>;`
`38`	`38`	`type i16s: SimdInt<i16, Self, Block = i16x8<Self>>;`
`39`		`- type u32s: SimdInt<u32, Self, Block = u32x4<Self>>;`
	`39`	`+ type u32s: SimdInt<u32, Self, Block = u32x4<Self>> + SimdCvtTruncate<Self::f32s>;`
`40`	`40`	`type i32s: SimdInt<i32, Self, Block = i32x4<Self>>;`
`41`	`41`	`type mask8s: SimdMask<i8, Self, Block = mask8x16<Self>>;`
`42`	`42`	`type mask16s: SimdMask<i16, Self, Block = mask16x8<Self>>;`
`@@ -101,6 +101,9 @@ fn mk_simd_float() -> TokenStream {`
`101`	`101`	`+ core::ops::Div<Output = Self>`
`102`	`102`	`+ core::ops::Div<Element, Output = Self>`
`103`	`103`	`{`
	`104`	`+ #[inline(always)]`
	`105`	`+ fn cvt_trunc<T: SimdCvtTruncate<Self>>(self) -> T { T::truncate_from(self) }`
	`106`	`+`
`104`	`107`	`#( #methods )*`
`105`	`108`	`}`
`106`	`109`	`}`
`@@ -123,6 +126,9 @@ fn mk_simd_int() -> TokenStream {`
`123`	`126`	`+ core::ops::BitXor<Output = Self>`
`124`	`127`	`+ core::ops::BitXor<Element, Output = Self>`
`125`	`128`	`{`
	`129`	`+ #[inline(always)]`
	`130`	`+ fn cvt_float<T: SimdCvtFloat<Self>>(self) -> T { T::float_from(self) }`
	`131`	`+`
`126`	`132`	`#( #methods )*`
`127`	`133`	`}`
`128`	`134`	`}`