cpu_asimd.c
1 #ifdef _MSC_VER 2 #include <Intrin.h> 3 #endif 4 #include <arm_neon.h> 5 6 int main(int argc, char **argv) 7 { 8 float *src = (float*)argv[argc-1]; 9 float32x4_t v1 = vdupq_n_f32(src[0]), v2 = vdupq_n_f32(src[1]); 10 /* MAXMIN */ 11 int ret = (int)vgetq_lane_f32(vmaxnmq_f32(v1, v2), 0); 12 ret += (int)vgetq_lane_f32(vminnmq_f32(v1, v2), 0); 13 /* ROUNDING */ 14 ret += (int)vgetq_lane_f32(vrndq_f32(v1), 0); 15 #ifdef __aarch64__ 16 { 17 double *src2 = (double*)argv[argc-1]; 18 float64x2_t vd1 = vdupq_n_f64(src2[0]), vd2 = vdupq_n_f64(src2[1]); 19 /* MAXMIN */ 20 ret += (int)vgetq_lane_f64(vmaxnmq_f64(vd1, vd2), 0); 21 ret += (int)vgetq_lane_f64(vminnmq_f64(vd1, vd2), 0); 22 /* ROUNDING */ 23 ret += (int)vgetq_lane_f64(vrndq_f64(vd1), 0); 24 } 25 #endif 26 return ret; 27 }