core: Use __jcvt() intrinsic on AArch64 for f64→i32 conversion

linkmauve · linkmauve · commit c10d4de21acb · 2025-11-04T09:56:46.000+01:00
In ruffle-rs#21780, an optimisation was added to use the ARMv8.3 fjcvtzs instruction, when available, to convert an f64 into an i32. This made me wonder why core::arch::aarch64 didn’t have an intrinsic for this instruction, so I implemented it in stdarch[1], which got pulled into Rust yesterday[2] (see the tracking issue[3]). This PR makes use of this new intrinsic to remove the unsafe asm!() block and simplify the code. [1] rust-lang/stdarch#1938 [2] rust-lang/rust#148402 [3] rust-lang/rust#147555
diff --git a/core/src/ecma_conversions.rs b/core/src/ecma_conversions.rs
@@ -44,8 +44,10 @@ pub fn f64_to_wrapping_i32(n: f64) -> i32 {
     #[cfg(target_arch = "aarch64")]
     {
         if std::arch::is_aarch64_feature_detected!("jsconv") {
-            // SAFETY: `jsconv` feature is checked in both compile time and runtime to be existed, so it's safe to call.
-            unsafe { f64_to_wrapping_int32_aarch64(n) }
+            // Converts an `f64` to an `i32` with ECMAScript `ToInt32` wrapping behavior.
+            // The value will be wrapped in the range [-2^31, 2^31).
+            // Optimized for aarch64 cpu with the fjcvtzs instruction.
+            std::arch::aarch64::__jcvt(n)
         } else {
             f64_to_wrapping_i32_generic(n)
         }
@@ -59,32 +61,6 @@ fn f64_to_wrapping_i32_generic(n: f64) -> i32 {
     f64_to_wrapping_u32(n) as i32
 }
 
-/// Converts an `f64` to an `i32` with ECMAScript `ToInt32` wrapping behavior.
-/// The value will be wrapped in the range [-2^31, 2^31).
-/// Optimized for aarch64 cpu with the fjcvtzs instruction.
-///
-/// # Safety
-///
-/// The caller must ensure either:
-/// - The target platform is aarch64 with `jsconv` feature enabled, or
-/// - Runtime feature detection has been performed to verify `jsconv` support
-#[allow(unused)]
-#[cfg(target_arch = "aarch64")]
-#[target_feature(enable = "jsconv")]
-unsafe fn f64_to_wrapping_int32_aarch64(number: f64) -> i32 {
-    let ret: i32;
-    // SAFETY: fjcvtzs instruction is available under jsconv feature.
-    unsafe {
-        std::arch::asm!(
-            "fjcvtzs {dst:w}, {src:d}",
-            src = in(vreg) number,
-            dst = out(reg) ret,
-            options(nostack, nomem, pure)
-        );
-    }
-    ret
-}
-
 /// Implements the IEEE-754 "Round to nearest, ties to even" rounding rule.
 /// (e.g., both 1.5 and 2.5 will round to 2).
 /// This also clamps out-of-range values and NaN to `i32::MIN`.
diff --git a/core/src/lib.rs b/core/src/lib.rs
@@ -4,6 +4,9 @@
 // This lint is good in theory, but in AVMs we often need to do `let x = args.get(0); let y = args.get(1);` etc.
 // It'd make those much less readable and consistent.
 #![allow(clippy::get_first)]
+// This enables the core::arch::aarch64::__jcvt() intrinsic, which is used to convert an f64 into
+// an i32 with JavaScript (ECMAScript ToInt32) semantics on ARMv8.3+.
+#![feature(stdarch_aarch64_jscvt)]
 
 #[macro_use]
 mod display_object;