pub fn sra16(a: usize, b: u32) -> usize
stdsimd
Arithmetic right shift of packed 16-bit elements, without rounding up.