Auto merge of #3237 - RalfJung:simd-loadstore, r=RalfJung

implement and test simd_masked_load and simd_masked_store

also extend the scatter/gather tests

Fixes https://github.com/rust-lang/miri/issues/3235
This commit is contained in:
bors 2023-12-22 11:29:56 +00:00
commit 2c7e0fd373
2 changed files with 111 additions and 6 deletions

View File

@ -656,6 +656,54 @@ pub trait EvalContextExt<'mir, 'tcx: 'mir>: crate::MiriInterpCxExt<'mir, 'tcx> {
}
}
}
"masked_load" => {
let [mask, ptr, default] = check_arg_count(args)?;
let (mask, mask_len) = this.operand_to_simd(mask)?;
let ptr = this.read_pointer(ptr)?;
let (default, default_len) = this.operand_to_simd(default)?;
let (dest, dest_len) = this.place_to_simd(dest)?;
assert_eq!(dest_len, mask_len);
assert_eq!(dest_len, default_len);
for i in 0..dest_len {
let mask = this.read_immediate(&this.project_index(&mask, i)?)?;
let default = this.read_immediate(&this.project_index(&default, i)?)?;
let dest = this.project_index(&dest, i)?;
let val = if simd_element_to_bool(mask)? {
// Size * u64 is implemented as always checked
#[allow(clippy::arithmetic_side_effects)]
let ptr = ptr.wrapping_offset(dest.layout.size * i, this);
let place = this.ptr_to_mplace(ptr, dest.layout);
this.read_immediate(&place)?
} else {
default
};
this.write_immediate(*val, &dest)?;
}
}
"masked_store" => {
let [mask, ptr, vals] = check_arg_count(args)?;
let (mask, mask_len) = this.operand_to_simd(mask)?;
let ptr = this.read_pointer(ptr)?;
let (vals, vals_len) = this.operand_to_simd(vals)?;
assert_eq!(mask_len, vals_len);
for i in 0..vals_len {
let mask = this.read_immediate(&this.project_index(&mask, i)?)?;
let val = this.read_immediate(&this.project_index(&vals, i)?)?;
if simd_element_to_bool(mask)? {
// Size * u64 is implemented as always checked
#[allow(clippy::arithmetic_side_effects)]
let ptr = ptr.wrapping_offset(val.layout.size * i, this);
let place = this.ptr_to_mplace(ptr, val.layout);
this.write_immediate(*val, &place)?
};
}
}
name => throw_unsup_format!("unimplemented intrinsic: `simd_{name}`"),
}

View File

@ -1,6 +1,8 @@
//@compile-flags: -Zmiri-strict-provenance
#![feature(portable_simd, platform_intrinsics, adt_const_params, inline_const)]
#![feature(portable_simd, platform_intrinsics, adt_const_params, inline_const, core_intrinsics)]
#![allow(incomplete_features, internal_features)]
use std::intrinsics::simd as intrinsics;
use std::ptr;
use std::simd::{prelude::*, StdFloat};
fn simd_ops_f32() {
@ -421,6 +423,40 @@ fn simd_gather_scatter() {
let idxs = Simd::from_array([9, 3, 0, 0]);
Simd::from_array([-27, 82, -41, 124]).scatter(&mut vec, idxs);
assert_eq!(vec, vec![124, 11, 12, 82, 14, 15, 16, 17, 18]);
// We call the intrinsics directly to experiment with dangling pointers and masks.
let val = 42u8;
let ptrs: Simd<*const u8, 4> =
Simd::from_array([ptr::null(), ptr::addr_of!(val), ptr::addr_of!(val), ptr::addr_of!(val)]);
let default = u8x4::splat(0);
let mask = i8x4::from_array([0, !0, 0, !0]);
let vals = unsafe { intrinsics::simd_gather(default, ptrs, mask) };
assert_eq!(vals, u8x4::from_array([0, 42, 0, 42]),);
let mut val1 = 0u8;
let mut val2 = 0u8;
let ptrs: Simd<*mut u8, 4> = Simd::from_array([
ptr::null_mut(),
ptr::addr_of_mut!(val1),
ptr::addr_of_mut!(val1),
ptr::addr_of_mut!(val2),
]);
let vals = u8x4::from_array([1, 2, 3, 4]);
unsafe { intrinsics::simd_scatter(vals, ptrs, mask) };
assert_eq!(val1, 2);
assert_eq!(val2, 4);
// Also check what happens when `scatter` has multiple overlapping pointers.
let mut val = 0u8;
let ptrs: Simd<*mut u8, 4> = Simd::from_array([
ptr::addr_of_mut!(val),
ptr::addr_of_mut!(val),
ptr::addr_of_mut!(val),
ptr::addr_of_mut!(val),
]);
let vals = u8x4::from_array([1, 2, 3, 4]);
unsafe { intrinsics::simd_scatter(vals, ptrs, mask) };
assert_eq!(val, 4);
}
fn simd_round() {
@ -460,14 +496,11 @@ fn simd_round() {
}
fn simd_intrinsics() {
use intrinsics::*;
extern "platform-intrinsic" {
fn simd_eq<T, U>(x: T, y: T) -> U;
fn simd_reduce_any<T>(x: T) -> bool;
fn simd_reduce_all<T>(x: T) -> bool;
fn simd_select<M, T>(m: M, yes: T, no: T) -> T;
fn simd_shuffle_generic<T, U, const IDX: &'static [u32]>(x: T, y: T) -> U;
fn simd_shuffle<T, IDX, U>(x: T, y: T, idx: IDX) -> U;
}
unsafe {
// Make sure simd_eq returns all-1 for `true`
let a = i32x4::splat(10);
@ -503,6 +536,29 @@ fn simd_intrinsics() {
}
}
fn simd_masked_loadstore() {
// The buffer is deliberarely too short, so reading the last element would be UB.
let buf = [3i32; 3];
let default = i32x4::splat(0);
let mask = i32x4::from_array([!0, !0, !0, 0]);
let vals = unsafe { intrinsics::simd_masked_load(mask, buf.as_ptr(), default) };
assert_eq!(vals, i32x4::from_array([3, 3, 3, 0]));
// Also read in a way that the *first* element is OOB.
let mask2 = i32x4::from_array([0, !0, !0, !0]);
let vals =
unsafe { intrinsics::simd_masked_load(mask2, buf.as_ptr().wrapping_sub(1), default) };
assert_eq!(vals, i32x4::from_array([0, 3, 3, 3]));
// The buffer is deliberarely too short, so writing the last element would be UB.
let mut buf = [42i32; 3];
let vals = i32x4::from_array([1, 2, 3, 4]);
unsafe { intrinsics::simd_masked_store(mask, buf.as_mut_ptr(), vals) };
assert_eq!(buf, [1, 2, 3]);
// Also write in a way that the *first* element is OOB.
unsafe { intrinsics::simd_masked_store(mask2, buf.as_mut_ptr().wrapping_sub(1), vals) };
assert_eq!(buf, [2, 3, 4]);
}
fn main() {
simd_mask();
simd_ops_f32();
@ -513,4 +569,5 @@ fn main() {
simd_gather_scatter();
simd_round();
simd_intrinsics();
simd_masked_loadstore();
}