Skip to content

Commit 9239a91

Browse files
committed
add simd_insert_dyn and simd_extract_dyn
1 parent 249cb84 commit 9239a91

File tree

6 files changed

+190
-7
lines changed

6 files changed

+190
-7
lines changed

compiler/rustc_codegen_llvm/src/intrinsic.rs

+24
Original file line numberDiff line numberDiff line change
@@ -1445,6 +1445,23 @@ fn generic_simd_intrinsic<'ll, 'tcx>(
14451445
bx.const_i32(idx as i32),
14461446
));
14471447
}
1448+
if name == sym::simd_insert_dyn {
1449+
require!(
1450+
in_elem == arg_tys[2],
1451+
InvalidMonomorphization::InsertedType {
1452+
span,
1453+
name,
1454+
in_elem,
1455+
in_ty,
1456+
out_ty: arg_tys[2]
1457+
}
1458+
);
1459+
return Ok(bx.insert_element(
1460+
args[0].immediate(),
1461+
args[2].immediate(),
1462+
args[1].immediate(),
1463+
));
1464+
}
14481465
if name == sym::simd_extract {
14491466
require!(
14501467
ret_ty == in_elem,
@@ -1463,6 +1480,13 @@ fn generic_simd_intrinsic<'ll, 'tcx>(
14631480
}
14641481
return Ok(bx.extract_element(args[0].immediate(), bx.const_i32(idx as i32)));
14651482
}
1483+
if name == sym::simd_extract_dyn {
1484+
require!(
1485+
ret_ty == in_elem,
1486+
InvalidMonomorphization::ReturnType { span, name, in_elem, in_ty, ret_ty }
1487+
);
1488+
return Ok(bx.extract_element(args[0].immediate(), args[1].immediate()));
1489+
}
14661490

14671491
if name == sym::simd_select {
14681492
let m_elem_ty = in_elem;

compiler/rustc_hir_analysis/src/check/intrinsic.rs

+6-2
Original file line numberDiff line numberDiff line change
@@ -674,8 +674,12 @@ pub fn check_intrinsic_type(
674674
sym::simd_masked_load => (3, 0, vec![param(0), param(1), param(2)], param(2)),
675675
sym::simd_masked_store => (3, 0, vec![param(0), param(1), param(2)], tcx.types.unit),
676676
sym::simd_scatter => (3, 0, vec![param(0), param(1), param(2)], tcx.types.unit),
677-
sym::simd_insert => (2, 0, vec![param(0), tcx.types.u32, param(1)], param(0)),
678-
sym::simd_extract => (2, 0, vec![param(0), tcx.types.u32], param(1)),
677+
sym::simd_insert | sym::simd_insert_dyn => {
678+
(2, 0, vec![param(0), tcx.types.u32, param(1)], param(0))
679+
}
680+
sym::simd_extract | sym::simd_extract_dyn => {
681+
(2, 0, vec![param(0), tcx.types.u32], param(1))
682+
}
679683
sym::simd_cast
680684
| sym::simd_as
681685
| sym::simd_cast_ptr

compiler/rustc_span/src/symbol.rs

+2
Original file line numberDiff line numberDiff line change
@@ -1885,6 +1885,7 @@ symbols! {
18851885
simd_eq,
18861886
simd_expose_provenance,
18871887
simd_extract,
1888+
simd_extract_dyn,
18881889
simd_fabs,
18891890
simd_fcos,
18901891
simd_fexp,
@@ -1903,6 +1904,7 @@ symbols! {
19031904
simd_ge,
19041905
simd_gt,
19051906
simd_insert,
1907+
simd_insert_dyn,
19061908
simd_le,
19071909
simd_lt,
19081910
simd_masked_load,

library/core/src/intrinsics/simd.rs

+36-3
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
55
/// Inserts an element into a vector, returning the updated vector.
66
///
7-
/// `T` must be a vector with element type `U`.
7+
/// `T` must be a vector with element type `U`, and `idx` must be `const`.
88
///
99
/// # Safety
1010
///
@@ -15,15 +15,48 @@ pub const unsafe fn simd_insert<T, U>(x: T, idx: u32, val: U) -> T;
1515

1616
/// Extracts an element from a vector.
1717
///
18-
/// `T` must be a vector with element type `U`.
18+
/// `T` must be a vector with element type `U`, and `idx` must be `const`.
1919
///
2020
/// # Safety
2121
///
22-
/// `idx` must be in-bounds of the vector.
22+
/// `idx` must be `const` and in-bounds of the vector.
2323
#[rustc_intrinsic]
2424
#[rustc_nounwind]
2525
pub const unsafe fn simd_extract<T, U>(x: T, idx: u32) -> U;
2626

27+
/// Inserts an element into a vector, returning the updated vector.
28+
///
29+
/// `T` must be a vector with element type `U`.
30+
///
31+
/// If the index is `const`, [`simd_insert`] may emit better assembly.
32+
///
33+
/// # Safety
34+
///
35+
/// `idx` must be in-bounds of the vector.
36+
#[rustc_nounwind]
37+
#[cfg_attr(not(bootstrap), rustc_intrinsic)]
38+
pub unsafe fn simd_insert_dyn<T, U>(mut x: T, idx: u32, val: U) -> T {
39+
// SAFETY: the caller guarantees that `idx` is in-bounds of the vector.
40+
unsafe { (&mut x as *mut T as *mut U).add(idx as usize).write(val) }
41+
x
42+
}
43+
44+
/// Extracts an element from a vector.
45+
///
46+
/// `T` must be a vector with element type `U`.
47+
///
48+
/// If the index is `const`, [`simd_extract`] may emit better assembly.
49+
///
50+
/// # Safety
51+
///
52+
/// `idx` must be in-bounds of the vector.
53+
#[rustc_nounwind]
54+
#[cfg_attr(not(bootstrap), rustc_intrinsic)]
55+
pub unsafe fn simd_extract_dyn<T, U>(x: T, idx: u32) -> U {
56+
// SAFETY: the caller guarantees that `idx` is in-bounds of the vector.
57+
unsafe { (&x as *const T as *const U).add(idx as usize).read() }
58+
}
59+
2760
/// Adds two simd vectors elementwise.
2861
///
2962
/// `T` must be a vector of integers or floats.
+83
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,83 @@
1+
//@compile-flags: -Copt-level=3 -Z merge-functions=disabled
2+
3+
#![feature(core_intrinsics, s390x_target_feature, repr_simd)]
4+
#![no_std]
5+
#![crate_type = "lib"]
6+
#![allow(non_camel_case_types)]
7+
8+
// Test that `core::intrinsics::simd::{simd_extract_dyn, simd_insert_dyn}`
9+
// lower to LLVM `extractelement`/`insertelement`, so that they can optimize to
// dedicated instructions on platforms that support them.
10+
11+
use core::intrinsics::simd::{simd_extract, simd_extract_dyn, simd_insert, simd_insert_dyn};
12+
13+
#[repr(simd)]
14+
#[derive(Clone, Copy)]
15+
pub struct u32x16([u32; 16]);
16+
17+
#[repr(simd)]
18+
#[derive(Clone, Copy)]
19+
pub struct i8x16([i8; 16]);
20+
21+
// CHECK-LABEL: dyn_simd_extract
22+
// CHECK: extractelement <16 x i8> %x, i32 %idx
23+
// CHECK-NEXT: ret
24+
#[no_mangle]
25+
unsafe extern "C" fn dyn_simd_extract(x: i8x16, idx: u32) -> i8 {
26+
simd_extract_dyn(x, idx)
27+
}
28+
29+
// CHECK-LABEL: literal_dyn_simd_extract
30+
// CHECK: extractelement <16 x i8> %x, i64 7
31+
// CHECK-NEXT: ret
32+
#[no_mangle]
33+
unsafe extern "C" fn literal_dyn_simd_extract(x: i8x16) -> i8 {
34+
simd_extract_dyn(x, 7)
35+
}
36+
37+
// CHECK-LABEL: const_dyn_simd_extract
38+
// CHECK: extractelement <16 x i8> %x, i64 7
39+
// CHECK-NEXT: ret
40+
#[no_mangle]
41+
unsafe extern "C" fn const_dyn_simd_extract(x: i8x16) -> i8 {
42+
simd_extract_dyn(x, const { 3 + 4 })
43+
}
44+
45+
// CHECK-LABEL: const_simd_extract
46+
// CHECK: extractelement <16 x i8> %x, i64 7
47+
// CHECK-NEXT: ret
48+
#[no_mangle]
49+
unsafe extern "C" fn const_simd_extract(x: i8x16) -> i8 {
50+
simd_extract(x, const { 3 + 4 })
51+
}
52+
53+
// CHECK-LABEL: dyn_simd_insert
54+
// CHECK: insertelement <16 x i8> %x, i8 %e, i32 %idx
55+
// CHECK-NEXT: ret
56+
#[no_mangle]
57+
unsafe extern "C" fn dyn_simd_insert(x: i8x16, e: i8, idx: u32) -> i8x16 {
58+
simd_insert_dyn(x, idx, e)
59+
}
60+
61+
// CHECK-LABEL: literal_dyn_simd_insert
62+
// CHECK: insertelement <16 x i8> %x, i8 %e, i64 7
63+
// CHECK-NEXT: ret
64+
#[no_mangle]
65+
unsafe extern "C" fn literal_dyn_simd_insert(x: i8x16, e: i8) -> i8x16 {
66+
simd_insert_dyn(x, 7, e)
67+
}
68+
69+
// CHECK-LABEL: const_dyn_simd_insert
70+
// CHECK: insertelement <16 x i8> %x, i8 %e, i64 7
71+
// CHECK-NEXT: ret
72+
#[no_mangle]
73+
unsafe extern "C" fn const_dyn_simd_insert(x: i8x16, e: i8) -> i8x16 {
74+
simd_insert_dyn(x, const { 3 + 4 }, e)
75+
}
76+
77+
// CHECK-LABEL: const_simd_insert
78+
// CHECK: insertelement <16 x i8> %x, i8 %e, i64 7
79+
// CHECK-NEXT: ret
80+
#[no_mangle]
81+
unsafe extern "C" fn const_simd_insert(x: i8x16, e: i8) -> i8x16 {
82+
simd_insert(x, const { 3 + 4 }, e)
83+
}

tests/ui/simd/intrinsic/generic-elements-pass.rs

+39-2
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,10 @@
11
//@ run-pass
22

3-
#![feature(repr_simd, core_intrinsics)]
3+
#![feature(repr_simd, intrinsics, core_intrinsics)]
44

5-
use std::intrinsics::simd::{simd_extract, simd_insert, simd_shuffle};
5+
use std::intrinsics::simd::{
6+
simd_extract, simd_extract_dyn, simd_insert, simd_insert_dyn, simd_shuffle,
7+
};
68

79
#[repr(simd)]
810
#[derive(Copy, Clone, Debug, PartialEq)]
@@ -70,6 +72,41 @@ fn main() {
7072
all_eq!(simd_extract(x8, 6), 86);
7173
all_eq!(simd_extract(x8, 7), 87);
7274
}
75+
unsafe {
76+
all_eq!(simd_insert_dyn(x2, 0, 100), i32x2([100, 21]));
77+
all_eq!(simd_insert_dyn(x2, 1, 100), i32x2([20, 100]));
78+
79+
all_eq!(simd_insert_dyn(x4, 0, 100), i32x4([100, 41, 42, 43]));
80+
all_eq!(simd_insert_dyn(x4, 1, 100), i32x4([40, 100, 42, 43]));
81+
all_eq!(simd_insert_dyn(x4, 2, 100), i32x4([40, 41, 100, 43]));
82+
all_eq!(simd_insert_dyn(x4, 3, 100), i32x4([40, 41, 42, 100]));
83+
84+
all_eq!(simd_insert_dyn(x8, 0, 100), i32x8([100, 81, 82, 83, 84, 85, 86, 87]));
85+
all_eq!(simd_insert_dyn(x8, 1, 100), i32x8([80, 100, 82, 83, 84, 85, 86, 87]));
86+
all_eq!(simd_insert_dyn(x8, 2, 100), i32x8([80, 81, 100, 83, 84, 85, 86, 87]));
87+
all_eq!(simd_insert_dyn(x8, 3, 100), i32x8([80, 81, 82, 100, 84, 85, 86, 87]));
88+
all_eq!(simd_insert_dyn(x8, 4, 100), i32x8([80, 81, 82, 83, 100, 85, 86, 87]));
89+
all_eq!(simd_insert_dyn(x8, 5, 100), i32x8([80, 81, 82, 83, 84, 100, 86, 87]));
90+
all_eq!(simd_insert_dyn(x8, 6, 100), i32x8([80, 81, 82, 83, 84, 85, 100, 87]));
91+
all_eq!(simd_insert_dyn(x8, 7, 100), i32x8([80, 81, 82, 83, 84, 85, 86, 100]));
92+
93+
all_eq!(simd_extract_dyn(x2, 0), 20);
94+
all_eq!(simd_extract_dyn(x2, 1), 21);
95+
96+
all_eq!(simd_extract_dyn(x4, 0), 40);
97+
all_eq!(simd_extract_dyn(x4, 1), 41);
98+
all_eq!(simd_extract_dyn(x4, 2), 42);
99+
all_eq!(simd_extract_dyn(x4, 3), 43);
100+
101+
all_eq!(simd_extract_dyn(x8, 0), 80);
102+
all_eq!(simd_extract_dyn(x8, 1), 81);
103+
all_eq!(simd_extract_dyn(x8, 2), 82);
104+
all_eq!(simd_extract_dyn(x8, 3), 83);
105+
all_eq!(simd_extract_dyn(x8, 4), 84);
106+
all_eq!(simd_extract_dyn(x8, 5), 85);
107+
all_eq!(simd_extract_dyn(x8, 6), 86);
108+
all_eq!(simd_extract_dyn(x8, 7), 87);
109+
}
73110

74111
let y2 = i32x2([120, 121]);
75112
let y4 = i32x4([140, 141, 142, 143]);

0 commit comments

Comments
 (0)