File: //lib/python3/dist-packages/numpy/distutils/checks/cpu_neon_vfpv4.c
#ifdef _MSC_VER
    #include <Intrin.h>
#endif
#include <arm_neon.h>
int main(void)
{
    float32x4_t v1 = vdupq_n_f32(1.0f);
    float32x4_t v2 = vdupq_n_f32(2.0f);
    float32x4_t v3 = vdupq_n_f32(3.0f);
    int ret = (int)vgetq_lane_f32(vfmaq_f32(v1, v2, v3), 0);
#ifdef __aarch64__
    float64x2_t vd1 = vdupq_n_f64(1.0);
    float64x2_t vd2 = vdupq_n_f64(2.0);
    float64x2_t vd3 = vdupq_n_f64(3.0);
    ret += (int)vgetq_lane_f64(vfmaq_f64(vd1, vd2, vd3), 0);
#endif
    return ret;
}