unsafe extern "C" fn vgatherdps_128( src: Simd<f32, 4>, slice: *const u8, offsets: Simd<i32, 4>, k: u8, scale: i32, ) -> Simd<f32, 4>