pub fn crsa16(a: usize, b: usize) -> usize
stdsimd
Cross subtracts and adds packed 16-bit signed numbers, discarding overflow bits.