pub fn pkbt16(a: usize, b: usize) -> usize
stdsimd
Packs two 16-bit data items, taken from the bottom and top halves of 32-bit chunks.