linebender
diff --git a/fearless_simd/src/generated/fallback.rs b/fearless_simd/src/generated/fallback.rs
Lines changed: 37 additions & 1 deletion
diff --git a/fearless_simd/src/generated/neon.rs b/fearless_simd/src/generated/neon.rs
Lines changed: 25 additions & 1 deletion
diff --git a/fearless_simd/src/generated/simd_trait.rs b/fearless_simd/src/generated/simd_trait.rs
Lines changed: 14 additions & 4 deletions
diff --git a/fearless_simd/src/generated/wasm.rs b/fearless_simd/src/generated/wasm.rs
Lines changed: 25 additions & 1 deletion
diff --git a/fearless_simd/src/traits.rs b/fearless_simd/src/traits.rs
Lines changed: 10 additions & 0 deletions
diff --git a/fearless_simd_gen/src/mk_fallback.rs b/fearless_simd_gen/src/mk_fallback.rs
Lines changed: 17 additions & 1 deletion
diff --git a/fearless_simd_gen/src/mk_neon.rs b/fearless_simd_gen/src/mk_neon.rs
Lines changed: 34 additions & 2 deletions
diff --git a/fearless_simd_gen/src/mk_simd_trait.rs b/fearless_simd_gen/src/mk_simd_trait.rs
Lines changed: 10 additions & 4 deletions
@@ -1,6 +1,6 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Level, Simd, SimdInto, seal::Seal};
+use crate::{Level, Simd, SimdCvtFloat, SimdCvtTruncate, SimdInto, seal::Seal};
 use crate::{
     f32x4, f32x8, f32x16, i8x16, i8x32, i8x64, i16x8, i16x16, i16x32, i32x4, i32x8, i32x16,
     mask8x16, mask8x32, mask8x64, mask16x8, mask16x16, mask16x32, mask32x4, mask32x8, mask32x16,
@@ -4847,3 +4847,39 @@ impl Simd for Fallback {
         (b0.simd_into(self), b1.simd_into(self))
     }
 }
+impl SimdCvtTruncate<f32x4<Fallback>> for i32x4<Fallback> {
+    #[inline(always)]
+    fn truncate_from(x: f32x4<Fallback>) -> Self {
+        Self {
+            val: x.val.map(|e| e as i32),
+            simd: x.simd,
+        }
+    }
+}
+impl SimdCvtTruncate<f32x4<Fallback>> for u32x4<Fallback> {
+    #[inline(always)]
+    fn truncate_from(x: f32x4<Fallback>) -> Self {
+        Self {
+            val: x.val.map(|e| e as u32),
+            simd: x.simd,
+        }
+    }
+}
+impl SimdCvtFloat<i32x4<Fallback>> for f32x4<Fallback> {
+    #[inline(always)]
+    fn float_from(x: i32x4<Fallback>) -> Self {
+        Self {
+            val: x.val.map(|e| e as f32),
+            simd: x.simd,
+        }
+    }
+}
+impl SimdCvtFloat<u32x4<Fallback>> for f32x4<Fallback> {
+    #[inline(always)]
+    fn float_from(x: u32x4<Fallback>) -> Self {
+        Self {
+            val: x.val.map(|e| e as f32),
+            simd: x.simd,
+        }
+    }
+}
@@ -1,6 +1,6 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Level, Simd, SimdFrom, SimdInto, seal::Seal};
+use crate::{Level, Simd, SimdCvtFloat, SimdCvtTruncate, SimdFrom, SimdInto, seal::Seal};
 use crate::{
     f32x4, f32x8, f32x16, i8x16, i8x32, i8x64, i16x8, i16x16, i16x32, i32x4, i32x8, i32x16,
     mask8x16, mask8x32, mask8x64, mask16x8, mask16x16, mask16x32, mask32x4, mask32x8, mask32x16,
@@ -3138,6 +3138,30 @@ impl Simd for Neon {
         (b0.simd_into(self), b1.simd_into(self))
     }
 }
+impl SimdCvtTruncate<f32x4<Neon>> for i32x4<Neon> {
+    #[inline(always)]
+    fn truncate_from(x: f32x4<Neon>) -> Self {
+        unsafe { vcvtq_s32_f32(x.into()).simd_into(x.simd) }
+    }
+}
+impl SimdCvtTruncate<f32x4<Neon>> for u32x4<Neon> {
+    #[inline(always)]
+    fn truncate_from(x: f32x4<Neon>) -> Self {
+        unsafe { vcvtq_u32_f32(x.into()).simd_into(x.simd) }
+    }
+}
+impl SimdCvtFloat<i32x4<Neon>> for f32x4<Neon> {
+    #[inline(always)]
+    fn float_from(x: i32x4<Neon>) -> Self {
+        unsafe { vcvtq_f32_s32(x.into()).simd_into(x.simd) }
+    }
+}
+impl SimdCvtFloat<u32x4<Neon>> for f32x4<Neon> {
+    #[inline(always)]
+    fn float_from(x: u32x4<Neon>) -> Self {
+        unsafe { vcvtq_f32_u32(x.into()).simd_into(x.simd) }
+    }
+}
 impl<S: Simd> SimdFrom<float32x4_t, S> for f32x4<S> {
     #[inline(always)]
     fn simd_from(arch: float32x4_t, simd: S) -> Self {
 
@@ -1,20 +1,22 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Level, SimdElement, SimdInto, seal::Seal};
+use crate::{Level, SimdCvtFloat, SimdCvtTruncate, SimdElement, SimdInto, seal::Seal};
 use crate::{
     f32x4, f32x8, f32x16, i8x16, i8x32, i8x64, i16x8, i16x16, i16x32, i32x4, i32x8, i32x16,
     mask8x16, mask8x32, mask8x64, mask16x8, mask16x16, mask16x32, mask32x4, mask32x8, mask32x16,
     u8x16, u8x32, u8x64, u16x8, u16x16, u16x32, u32x4, u32x8, u32x16,
 };
 #[doc = r" TODO: docstring"]
 pub trait Simd: Sized + Clone + Copy + Send + Sync + Seal + 'static {
-    type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>;
+    type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>
+        + SimdCvtFloat<Self::u32s>
+        + SimdCvtFloat<Self::i32s>;
     type u8s: SimdInt<u8, Self, Block = u8x16<Self>>;
     type i8s: SimdInt<i8, Self, Block = i8x16<Self>>;
     type u16s: SimdInt<u16, Self, Block = u16x8<Self>>;
     type i16s: SimdInt<i16, Self, Block = i16x8<Self>>;
-    type u32s: SimdInt<u32, Self, Block = u32x4<Self>>;
-    type i32s: SimdInt<i32, Self, Block = i32x4<Self>>;
+    type u32s: SimdInt<u32, Self, Block = u32x4<Self>> + SimdCvtTruncate<Self::f32s>;
+    type i32s: SimdInt<i32, Self, Block = i32x4<Self>> + SimdCvtTruncate<Self::f32s>;
     type mask8s: SimdMask<i8, Self, Block = mask8x16<Self>>;
     type mask16s: SimdMask<i16, Self, Block = mask16x8<Self>>;
     type mask32s: SimdMask<i32, Self, Block = mask32x4<Self>>;
@@ -655,6 +657,10 @@ pub trait SimdFloat<Element: SimdElement, S: Simd>:
     + core::ops::Div<Output = Self>
     + core::ops::Div<Element, Output = Self>
 {
+    #[inline(always)]
+    fn to_int<T: SimdCvtTruncate<Self>>(self) -> T {
+        T::truncate_from(self)
+    }
     fn abs(self) -> Self;
     fn sqrt(self) -> Self;
     fn copysign(self, rhs: impl SimdInto<Self, S>) -> Self;
@@ -690,6 +696,10 @@ pub trait SimdInt<Element: SimdElement, S: Simd>:
     + core::ops::BitXor<Output = Self>
     + core::ops::BitXor<Element, Output = Self>
 {
+    #[inline(always)]
+    fn to_float<T: SimdCvtFloat<Self>>(self) -> T {
+        T::float_from(self)
+    }
     fn simd_eq(self, rhs: impl SimdInto<Self, S>) -> Self::Mask;
     fn simd_lt(self, rhs: impl SimdInto<Self, S>) -> Self::Mask;
     fn simd_le(self, rhs: impl SimdInto<Self, S>) -> Self::Mask;
 
@@ -1,6 +1,6 @@
 // This file is autogenerated by fearless_simd_gen
 
-use crate::{Level, Simd, SimdFrom, SimdInto, seal::Seal};
+use crate::{Level, Simd, SimdCvtFloat, SimdCvtTruncate, SimdFrom, SimdInto, seal::Seal};
 use crate::{
     f32x4, f32x8, f32x16, i8x16, i8x32, i8x64, i16x8, i16x16, i16x32, i32x4, i32x8, i32x16,
     mask8x16, mask8x32, mask8x64, mask16x8, mask16x16, mask16x32, mask32x4, mask32x8, mask32x16,
@@ -3277,6 +3277,30 @@ impl Simd for WasmSimd128 {
         (b0.simd_into(self), b1.simd_into(self))
     }
 }
+impl SimdCvtTruncate<f32x4<WasmSimd128>> for i32x4<WasmSimd128> {
+    #[inline(always)]
+    fn truncate_from(x: f32x4<WasmSimd128>) -> Self {
+        i32x4_trunc_sat_f32x4(x.into()).simd_into(x.simd)
+    }
+}
+impl SimdCvtTruncate<f32x4<WasmSimd128>> for u32x4<WasmSimd128> {
+    #[inline(always)]
+    fn truncate_from(x: f32x4<WasmSimd128>) -> Self {
+        u32x4_trunc_sat_f32x4(x.into()).simd_into(x.simd)
+    }
+}
+impl SimdCvtFloat<i32x4<WasmSimd128>> for f32x4<WasmSimd128> {
+    #[inline(always)]
+    fn float_from(x: i32x4<WasmSimd128>) -> Self {
+        f32x4_convert_i32x4(x.into()).simd_into(x.simd)
+    }
+}
+impl SimdCvtFloat<u32x4<WasmSimd128>> for f32x4<WasmSimd128> {
+    #[inline(always)]
+    fn float_from(x: u32x4<WasmSimd128>) -> Self {
+        f32x4_convert_u32x4(x.into()).simd_into(x.simd)
+    }
+}
 impl<S: Simd> SimdFrom<v128, S> for f32x4<S> {
     #[inline(always)]
     fn simd_from(arch: v128, simd: S) -> Self {
 
@@ -105,3 +105,13 @@ impl SimdElement for u32 {
 impl SimdElement for i32 {
     type Mask = i32;
 }
+
+/// Construction of integer vectors from floating-point vectors by truncation (rounding toward zero).
+pub trait SimdCvtTruncate<T> {
+    fn truncate_from(x: T) -> Self;
+}
+
+/// Construction of floating-point vectors from integer vectors.
+pub trait SimdCvtFloat<T> {
+    fn float_from(x: T) -> Self;
+}
@@ -32,7 +32,7 @@ pub fn mk_fallback_impl() -> TokenStream {
 
     quote! {
         use core::ops::*;
-        use crate::{seal::Seal, Level, Simd, SimdInto};
+        use crate::{seal::Seal, Level, Simd, SimdInto, SimdCvtTruncate, SimdCvtFloat};
 
         #imports
 
@@ -342,6 +342,20 @@ fn mk_simd_impl() -> TokenStream {
             methods.push(method);
         }
     }
+
+    let cvts = crate::ops::conversions().map(|cvt| {
+        let dst_scalar = cvt.dst_scalar.rust(cvt.scalar_bits);
+        cvt.implement(
+            &level_tok,
+            quote! {
+                Self {
+                    val: x.val.map(|e| e as #dst_scalar),
+                    simd: x.simd,
+                }
+            },
+        )
+    });
+
     // Note: the `vectorize` implementation is pretty boilerplate and should probably
     // be factored out for DRY.
     quote! {
@@ -368,6 +382,8 @@ fn mk_simd_impl() -> TokenStream {
 
             #( #methods )*
         }
+
+        #( #cvts )*
     }
 }
 
 
@@ -2,7 +2,7 @@
 // SPDX-License-Identifier: Apache-2.0 OR MIT
 
 use proc_macro2::{Ident, Literal, Span, TokenStream};
-use quote::quote;
+use quote::{format_ident, quote};
 
 use crate::arch::neon::split_intrinsic;
 use crate::ops::{
@@ -44,7 +44,7 @@ pub fn mk_neon_impl(level: Level) -> TokenStream {
     quote! {
         use core::arch::aarch64::*;
 
-        use crate::{seal::Seal, Level, Simd, SimdFrom, SimdInto};
+        use crate::{seal::Seal, Level, Simd, SimdFrom, SimdInto, SimdCvtTruncate, SimdCvtFloat};
 
         #imports
 
@@ -352,6 +352,28 @@ fn mk_simd_impl(level: Level) -> TokenStream {
             methods.push(method);
         }
     }
+
+    let cvts = crate::ops::conversions().map(|cvt| {
+        let src_prefix = scalar_prefix(cvt.src_scalar);
+        let dst_prefix = scalar_prefix(cvt.dst_scalar);
+        let bits = cvt.scalar_bits;
+        let op = match cvt.len {
+            2 => "vcvt",
+            4 => "vcvtq",
+            _ => unimplemented!(),
+        };
+        // FIXME: verify the intrinsic saturates out-of-range/NaN inputs like the fallback's `as` cast.
+        let intrinsic = format_ident!("{op}_{dst_prefix}{bits}_{src_prefix}{bits}");
+        cvt.implement(
+            &level_tok,
+            quote! {
+                unsafe {
+                    #intrinsic(x.into()).simd_into(x.simd)
+                }
+            },
+        )
+    });
+
     // Note: the `vectorize` implementation is pretty boilerplate and should probably
     // be factored out for DRY.
     quote! {
@@ -384,6 +406,16 @@ fn mk_simd_impl(level: Level) -> TokenStream {
 
             #( #methods )*
         }
+
+        #( #cvts )*
+    }
+}
+
+fn scalar_prefix(ty: ScalarType) -> &'static str {
+    match ty {
+        ScalarType::Float => "f",
+        ScalarType::Unsigned | ScalarType::Mask => "u",
+        ScalarType::Int => "s",
     }
 }
 
 
@@ -26,18 +26,18 @@ pub fn mk_simd_trait() -> TokenStream {
         }
     }
     let mut code = quote! {
-        use crate::{seal::Seal, Level, SimdElement, SimdInto};
+        use crate::{seal::Seal, Level, SimdElement, SimdInto, SimdCvtTruncate, SimdCvtFloat};
         #imports
         /// TODO: docstring
         // TODO: Seal
         pub trait Simd: Sized + Clone + Copy + Send + Sync + Seal + 'static {
-            type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>;
+            type f32s: SimdFloat<f32, Self, Block = f32x4<Self>> + SimdCvtFloat<Self::u32s> + SimdCvtFloat<Self::i32s>;
             type u8s: SimdInt<u8, Self, Block = u8x16<Self>>;
             type i8s: SimdInt<i8, Self, Block = i8x16<Self>>;
             type u16s: SimdInt<u16, Self, Block = u16x8<Self>>;
             type i16s: SimdInt<i16, Self, Block = i16x8<Self>>;
-            type u32s: SimdInt<u32, Self, Block = u32x4<Self>>;
-            type i32s: SimdInt<i32, Self, Block = i32x4<Self>>;
+            type u32s: SimdInt<u32, Self, Block = u32x4<Self>> + SimdCvtTruncate<Self::f32s>;
+            type i32s: SimdInt<i32, Self, Block = i32x4<Self>> + SimdCvtTruncate<Self::f32s>;
             type mask8s: SimdMask<i8, Self, Block = mask8x16<Self>>;
             type mask16s: SimdMask<i16, Self, Block = mask16x8<Self>>;
             type mask32s: SimdMask<i32, Self, Block = mask32x4<Self>>;
@@ -101,6 +101,9 @@ fn mk_simd_float() -> TokenStream {
             + core::ops::Div<Output = Self>
             + core::ops::Div<Element, Output = Self>
         {
+            #[inline(always)]
+            fn to_int<T: SimdCvtTruncate<Self>>(self) -> T { T::truncate_from(self) }
+
             #( #methods )*
         }
     }
@@ -123,6 +126,9 @@ fn mk_simd_int() -> TokenStream {
             + core::ops::BitXor<Output = Self>
             + core::ops::BitXor<Element, Output = Self>
         {
+            #[inline(always)]
+            fn to_float<T: SimdCvtFloat<Self>>(self) -> T { T::float_from(self) }
+
             #( #methods )*
         }
     }
Original file line number	Diff line number	Diff line change
`@@ -26,18 +26,18 @@ pub fn mk_simd_trait() -> TokenStream {`
`26`	`26`	`}`
`27`	`27`	`}`
`28`	`28`	`let mut code = quote! {`
`29`		`- use crate::{seal::Seal, Level, SimdElement, SimdInto};`
	`29`	`+ use crate::{seal::Seal, Level, SimdElement, SimdInto, SimdCvtTruncate, SimdCvtFloat};`
`30`	`30`	`#imports`
`31`	`31`	`/// TODO: docstring`
`32`	`32`	`// TODO: Seal`
`33`	`33`	`pub trait Simd: Sized + Clone + Copy + Send + Sync + Seal + 'static {`
`34`		`- type f32s: SimdFloat<f32, Self, Block = f32x4<Self>>;`
	`34`	`+ type f32s: SimdFloat<f32, Self, Block = f32x4<Self>> + SimdCvtFloat<Self::u32s> + SimdCvtFloat<Self::i32s>;`
`35`	`35`	`type u8s: SimdInt<u8, Self, Block = u8x16<Self>>;`
`36`	`36`	`type i8s: SimdInt<i8, Self, Block = i8x16<Self>>;`
`37`	`37`	`type u16s: SimdInt<u16, Self, Block = u16x8<Self>>;`
`38`	`38`	`type i16s: SimdInt<i16, Self, Block = i16x8<Self>>;`
`39`		`- type u32s: SimdInt<u32, Self, Block = u32x4<Self>>;`
`40`		`- type i32s: SimdInt<i32, Self, Block = i32x4<Self>>;`
	`39`	`+ type u32s: SimdInt<u32, Self, Block = u32x4<Self>> + SimdCvtTruncate<Self::f32s>;`
	`40`	`+ type i32s: SimdInt<i32, Self, Block = i32x4<Self>> + SimdCvtTruncate<Self::f32s>;`
`41`	`41`	`type mask8s: SimdMask<i8, Self, Block = mask8x16<Self>>;`
`42`	`42`	`type mask16s: SimdMask<i16, Self, Block = mask16x8<Self>>;`
`43`	`43`	`type mask32s: SimdMask<i32, Self, Block = mask32x4<Self>>;`
`@@ -101,6 +101,9 @@ fn mk_simd_float() -> TokenStream {`
`101`	`101`	`+ core::ops::Div<Output = Self>`
`102`	`102`	`+ core::ops::Div<Element, Output = Self>`
`103`	`103`	`{`
	`104`	`+ #[inline(always)]`
	`105`	`+ fn to_int<T: SimdCvtTruncate<Self>>(self) -> T { T::truncate_from(self) }`
	`106`	`+`
`104`	`107`	`#( #methods )*`
`105`	`108`	`}`
`106`	`109`	`}`
`@@ -123,6 +126,9 @@ fn mk_simd_int() -> TokenStream {`
`123`	`126`	`+ core::ops::BitXor<Output = Self>`
`124`	`127`	`+ core::ops::BitXor<Element, Output = Self>`
`125`	`128`	`{`
	`129`	`+ #[inline(always)]`
	`130`	`+ fn to_float<T: SimdCvtFloat<Self>>(self) -> T { T::float_from(self) }`
	`131`	`+`
`126`	`132`	`#( #methods )*`
`127`	`133`	`}`
`128`	`134`	`}`