Skip to content

Commit dab8395

Browse files
committed
Implement simd_masked_store
1 parent c7b4e03 commit dab8395

File tree

2 files changed

+31
-1
lines changed

2 files changed

+31
-1
lines changed

scripts/test_rustc_tests.sh

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -44,7 +44,6 @@ rm tests/ui/proc-macro/no-mangle-in-proc-macro-issue-111888.rs
4444
# vendor intrinsics
4545
rm tests/ui/sse2.rs # CodegenBackend::target_features not yet implemented
4646
rm tests/ui/simd/array-type.rs # "Index argument for `simd_insert` is not a constant"
47-
rm tests/ui/simd/masked-load-store.rs
4847

4948
# exotic linkages
5049
rm tests/ui/issues/issue-33992.rs # unsupported linkages

src/intrinsics/simd.rs

Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -962,6 +962,37 @@ pub(super) fn codegen_simd_intrinsic_call<'tcx>(
962962
}
963963
}
964964

965+
// Lowering for the `simd_masked_store` intrinsic: the vector `val` is written to
// memory starting at `ptr` one lane at a time, and each lane's store is guarded
// by a branch on the corresponding lane of `mask`.
sym::simd_masked_store => {
966+
// Arguments are bound in the order (mask, ptr, val).
intrinsic_args!(fx, args => (mask, ptr, val); intrinsic);
967+
968+
// Lane count / element type of both vectors; the mask's element type is unused here.
let (val_lane_count, val_lane_ty) = val.layout().ty.simd_size_and_type(fx.tcx);
969+
let (mask_lane_count, _mask_lane_ty) = mask.layout().ty.simd_size_and_type(fx.tcx);
970+
// The per-lane loop below indexes both vectors with the same index, so they
// must have the same number of lanes.
assert_eq!(val_lane_count, mask_lane_count);
971+
// Cranelift type of a single value lane; its byte size is used as the store stride.
// NOTE(review): the `unwrap` assumes the lane type always maps to a Cranelift type — confirm.
let lane_clif_ty = fx.clif_type(val_lane_ty).unwrap();
972+
// Base address for all lane stores, loaded once outside the loop.
let ptr_val = ptr.load_scalar(fx);
973+
974+
for lane_idx in 0..val_lane_count {
975+
let val_lane = val.value_lane(fx, lane_idx).load_scalar(fx);
976+
let mask_lane = mask.value_lane(fx, lane_idx).load_scalar(fx);
977+
978+
// Two fresh blocks per lane: `if_enabled` performs the store, `next` is the
// join point where code generation continues.
let if_enabled = fx.bcx.create_block();
979+
let next = fx.bcx.create_block();
980+
981+
// Conditional branch on the mask lane: `if_enabled` is the taken target,
// `next` the fall-through target that skips the store.
fx.bcx.ins().brif(mask_lane, if_enabled, &[], next, &[]);
982+
// `if_enabled` is only targeted by the `brif` just emitted, so it can be sealed now.
fx.bcx.seal_block(if_enabled);
983+
984+
fx.bcx.switch_to_block(if_enabled);
985+
// Byte offset of this lane from the base pointer: lane index times lane size.
// NOTE(review): both factors are narrowed with `as i32`; presumably always
// small enough for real SIMD types — confirm.
let offset = lane_idx as i32 * lane_clif_ty.bytes() as i32;
986+
// NOTE(review): `MemFlags::trusted()` is used for the store — confirm its
// assumptions hold for the pointer passed to this intrinsic.
fx.bcx.ins().store(MemFlags::trusted(), val_lane, ptr_val, Offset32::new(offset));
987+
fx.bcx.ins().jump(next, &[]);
988+
989+
// Both edges into `next` (the `brif` and the `jump`) now exist, so seal it
// and continue emitting code there.
fx.bcx.seal_block(next);
990+
fx.bcx.switch_to_block(next);
991+
992+
// NOTE(review): the reason for this `nop` is not evident from this hunk;
// presumably it keeps `next` from being left empty — confirm.
fx.bcx.ins().nop();
993+
}
994+
}
995+
965996
sym::simd_gather => {
966997
intrinsic_args!(fx, args => (val, ptr, mask); intrinsic);
967998

0 commit comments

Comments
 (0)