pub fn decode_u8x32<S: SIMD256>(s: S, a: S::V256) -> Result<S::V128, ()>