|
6 | 6 | #[repr(simd, packed)]
|
7 | 7 | struct Simd<T, const N: usize>([T; N]);
|
8 | 8 |
|
| 9 | +#[repr(simd)] |
| 10 | +struct FullSimd<T, const N: usize>([T; N]); |
| 11 | + |
9 | 12 | fn check_size_align<T, const N: usize>() {
|
10 | 13 | use std::mem;
|
11 | 14 | assert_eq!(mem::size_of::<Simd<T, N>>(), mem::size_of::<[T; N]>());
|
@@ -37,9 +40,20 @@ fn main() {
|
37 | 40 |
|
38 | 41 | unsafe {
|
39 | 42 | // powers-of-two have no padding and work as usual
|
40 |
| - // non-powers-of-two have padding and need to be expanded to full vectors |
41 | 43 | let x: Simd<f64, 4> =
|
42 | 44 | simd_add(Simd::<f64, 4>([0., 1., 2., 3.]), Simd::<f64, 4>([2., 2., 2., 2.]));
|
43 | 45 | assert_eq!(std::mem::transmute::<_, [f64; 4]>(x), [2., 3., 4., 5.]);
|
| 46 | + |
| 47 | + // non-powers-of-two have padding and need to be expanded to full vectors |
| 48 | + fn load<T, const N: usize>(v: Simd<T, N>) -> FullSimd<T, N> { |
| 49 | + unsafe { |
| 50 | + let mut tmp = core::mem::MaybeUninit::<FullSimd<T, N>>::uninit(); |
| 51 | + std::ptr::copy_nonoverlapping(&v as *const _, tmp.as_mut_ptr().cast(), 1); |
| 52 | + tmp.assume_init() |
| 53 | + } |
| 54 | + } |
| 55 | + let x: FullSimd<f64, 3> = |
| 56 | + simd_add(load(Simd::<f64, 3>([0., 1., 2.])), load(Simd::<f64, 3>([2., 2., 2.]))); |
| 57 | + assert_eq!(x.0, [2., 3., 4.]); |
44 | 58 | }
|
45 | 59 | }
|
0 commit comments