/// Declared interface of `expandloadps_256`, an `unsafe` function using the C ABI.
///
/// Only the signature is visible at this point; the notes below describe the
/// declared types and deliberately avoid asserting behavior that is not shown.
///
/// NOTE(review): the name suggests this is the 256-bit, single-precision
/// "expand load" operation (cf. the AVX-512 `vexpandps` family) — TODO confirm
/// against the definition / link attribute.
///
/// # Parameters
///
/// - `mem_addr`: raw `*const f32` pointer. Presumably the address elements are
///   read from — verify against the implementation.
/// - `a`: an 8-lane `f32` vector (`Simd<f32, 8>`). Presumably supplies the lanes
///   that are not selected by `mask` — TODO confirm.
/// - `mask`: a `u8`. Presumably one selection bit per lane of the 8-lane
///   vector — TODO confirm.
///
/// # Returns
///
/// An 8-lane `f32` vector (`Simd<f32, 8>`).
///
/// # Safety
///
/// The function is declared `unsafe` and takes a raw pointer, so the caller is
/// responsible for upholding its contract. NOTE(review): the exact
/// requirements on `mem_addr` (validity, readable length, alignment) and any
/// required CPU features are not visible here — confirm before calling.
unsafe extern "C" fn expandloadps_256( mem_addr: *const f32, a: Simd<f32, 8>, mask: u8, ) -> Simd<f32, 8>