/// Signature of the C-ABI routine `cvtneps2bf16_128`.
///
/// Takes a 4-lane `f32` vector, an 8-lane `i16` vector and a `__mmask8`,
/// and returns an 8-lane `i16` vector.
///
/// NOTE(review): only the signature is visible here. Going by the name, this
/// presumably maps to the 128-bit masked form of the AVX512-BF16
/// `VCVTNEPS2BF16` conversion (f32 -> bf16 stored in `i16` lanes) — confirm
/// against the link attribute / body.
///
/// * `a`   - 4-lane `f32` input vector (presumably the values to convert).
/// * `src` - 8-lane `i16` vector (presumably the pass-through values used for
///   lanes whose mask bit is clear — TODO confirm).
/// * `k`   - `__mmask8` mask (presumably one bit per output lane — TODO
///   confirm which bits are significant).
///
/// # Safety
///
/// Declared `unsafe`, so every call must be made from an `unsafe` context.
/// The exact preconditions are not visible here; presumably the executing CPU
/// must support the required target features — verify before calling.
unsafe extern "C" fn cvtneps2bf16_128( a: Simd<f32, 4>, src: Simd<i16, 8>, k: __mmask8, ) -> Simd<i16, 8>