/// Signature of `vpdpbuud_256`, an `unsafe` function using the C ABI.
///
/// Parameters and return value, as declared:
/// - `src`: `Simd<i32, 8>`
/// - `a`: `Simd<u8, 32>`
/// - `b`: `Simd<u8, 32>`
/// - returns `Simd<i32, 8>`
///
/// NOTE(review): the name suggests this maps to the 256-bit x86 `VPDPBUUD`
/// instruction (unsigned-byte dot product of `a` and `b`, accumulated into the
/// 32-bit lanes of `src`). Neither a body nor a link target is visible here, so
/// confirm against the surrounding declaration before relying on that.
///
/// # Safety
///
/// The contract is not visible from this signature. Presumably the caller must
/// ensure the required CPU feature is available — TODO confirm.
unsafe extern "C" fn vpdpbuud_256( src: Simd<i32, 8>, a: Simd<u8, 32>, b: Simd<u8, 32>, ) -> Simd<i32, 8>