File size: 818 Bytes
6370773
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
#ifdef _MSC_VER
    #include <Intrin.h>
#endif
#include <arm_neon.h>

int main(int argc, char **argv)
{
    float *src = (float*)argv[argc-1];
    float32x4_t v1 = vdupq_n_f32(src[0]), v2 = vdupq_n_f32(src[1]);
    /* MAXMIN */
    int ret  = (int)vgetq_lane_f32(vmaxnmq_f32(v1, v2), 0);
        ret += (int)vgetq_lane_f32(vminnmq_f32(v1, v2), 0);
    /* ROUNDING */
    ret += (int)vgetq_lane_f32(vrndq_f32(v1), 0);
#ifdef __aarch64__
    {
        double *src2 = (double*)argv[argc-1];
        float64x2_t vd1 = vdupq_n_f64(src2[0]), vd2 = vdupq_n_f64(src2[1]);
        /* MAXMIN */
        ret += (int)vgetq_lane_f64(vmaxnmq_f64(vd1, vd2), 0);
        ret += (int)vgetq_lane_f64(vminnmq_f64(vd1, vd2), 0);
        /* ROUNDING */
        ret += (int)vgetq_lane_f64(vrndq_f64(vd1), 0);
    }
#endif
    return ret;
}