|
| 1 | +//@ compile-flags: -Cno-prepopulate-passes |
| 2 | + |
| 3 | +#![crate_type = "lib"] |
| 4 | +#![feature(repr_simd, core_intrinsics)] |
| 5 | +// make sure that codegen emits correctly-aligned loads and stores for repr(packed, simd) types |
| 6 | +// the alignment of a load should be no less than T, and no more than the size of the vector type |
| 7 | +use std::intrinsics::simd as intrinsics; |
| 8 | + |
| 9 | +#[derive(Copy, Clone)] |
| 10 | +#[repr(packed, simd)] |
| 11 | +struct f32x3([f32; 3]); |
| 12 | + |
| 13 | +#[derive(Copy, Clone)] |
| 14 | +#[repr(packed, simd)] |
| 15 | +struct f32x4([f32; 4]); |
| 16 | + |
| 17 | +// CHECK-LABEL: load_f32x3 |
| 18 | +#[no_mangle] |
| 19 | +pub fn load_f32x3(floats: &f32x3) -> f32x3 { |
| 20 | + // FIXME: Is a memcpy really the best we can do? |
| 21 | + // CHECK: @llvm.memcpy.{{.*}}ptr align 4 {{.*}}ptr align 4 |
| 22 | + *floats |
| 23 | +} |
| 24 | + |
| 25 | +// CHECK-LABEL: load_f32x4 |
| 26 | +#[no_mangle] |
| 27 | +pub fn load_f32x4(floats: &f32x4) -> f32x4 { |
| 28 | + // CHECK: load <4 x float>, ptr %{{[a-z0-9_]*}}, align {{4|8|16}} |
| 29 | + *floats |
| 30 | +} |
| 31 | + |
| 32 | +// CHECK-LABEL: add_f32x3 |
| 33 | +#[no_mangle] |
| 34 | +pub fn add_f32x3(x: f32x3, y: f32x3) -> f32x3 { |
| 35 | + // CHECK: load <3 x float>, ptr %{{[a-z0-9_]*}}, align 4 |
| 36 | + unsafe { intrinsics::simd_add(x, y) } |
| 37 | +} |
| 38 | + |
| 39 | +// CHECK-LABEL: add_f32x4 |
| 40 | +#[no_mangle] |
| 41 | +pub fn add_f32x4(x: f32x4, y: f32x4) -> f32x4 { |
| 42 | + // CHECK: load <4 x float>, ptr %{{[a-z0-9_]*}}, align {{4|8|16}} |
| 43 | + unsafe { intrinsics::simd_add(x, y) } |
| 44 | +} |
0 commit comments