1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
| #ifdef _MSC_VER
| #include <Intrin.h>
| #endif
| #include <arm_neon.h>
|
| int main(int argc, char **argv)
| {
| float *src = (float*)argv[argc-1];
| float32x4_t v1 = vdupq_n_f32(src[0]), v2 = vdupq_n_f32(src[1]);
| /* MAXMIN */
| int ret = (int)vgetq_lane_f32(vmaxnmq_f32(v1, v2), 0);
| ret += (int)vgetq_lane_f32(vminnmq_f32(v1, v2), 0);
| /* ROUNDING */
| ret += (int)vgetq_lane_f32(vrndq_f32(v1), 0);
| #ifdef __aarch64__
| {
| double *src2 = (double*)argv[argc-1];
| float64x2_t vd1 = vdupq_n_f64(src2[0]), vd2 = vdupq_n_f64(src2[1]);
| /* MAXMIN */
| ret += (int)vgetq_lane_f64(vmaxnmq_f64(vd1, vd2), 0);
| ret += (int)vgetq_lane_f64(vminnmq_f64(vd1, vd2), 0);
| /* ROUNDING */
| ret += (int)vgetq_lane_f64(vrndq_f64(vd1), 0);
| }
| #endif
| return ret;
| }
|
|