Skip to content

Commit

Permalink
fix ordering of lanes in neon
Browse files (browse the repository at this point in the history)
  • Loading branch information
mcroomp committed Oct 20, 2024
1 parent db39ef2 commit 7b90e98
Showing 1 changed file with 4 additions and 1 deletion.
5 changes: 4 additions & 1 deletion src/u32x4_.rs
Original file line number | Diff line number | Diff line change
Expand Up @@ -458,7 +458,10 @@ impl u32x4 {
u64x2 { simd: i64x2_mul((self & i64x2::splat(0xffffffff)).simd, (rhs.simd & i64x2::splat(0xffffffff))).simd }
} else if #[cfg(all(target_feature="neon",target_arch="aarch64"))] {
unsafe {
u64x2 { neon: vmull_u32(vget_low_u32(self.neon), vget_low_u32(rhs.neon)) }
let a = vuzpq_u32(self.neon, self.neon);
let b = vuzpq_u32(rhs.neon, rhs.neon);

u64x2 { neon: vmull_u32(vget_low_u32(a), vget_low_u32(b)) }
}
} else {
let a: [u32; 4] = cast(self);
Expand Down

0 comments on commit 7b90e98

Please sign in to comment.