20 lines
529 B
C
20 lines
529 B
C
|
#ifdef _MSC_VER
|
||
|
#include <Intrin.h>
|
||
|
#endif
|
||
|
#include <arm_neon.h>
|
||
|
|
||
|
/*
 * Exercises the half-precision widening multiply-accumulate intrinsics
 * vfmlal_low_f16 and vfmlslq_high_f16, then returns the sum of lane 0 of
 * each result after conversion to int.
 *
 * The scalar operands are not literals: two float16_t values are read
 * through the last argv pointer and two float values through the
 * second-to-last one. No check is made on argc or on the size/alignment
 * of the data those pointers refer to.
 *
 * NOTE(review): this looks like a compiler feature probe where argv is used
 * so the intrinsic calls cannot be constant-folded away -- confirm against
 * the build scripts that consume this file.
 */
int main(int argc, char **argv)
{
    float16_t *half_in = (float16_t*)argv[argc-1];
    float *single_in = (float*)argv[argc-2];

    /* Broadcast one scalar into every lane of each operand vector. */
    float16x8_t half_q = vdupq_n_f16(*half_in);
    float16x4_t half_d = vdup_n_f16(*(half_in + 1));
    float32x4_t single_q = vdupq_n_f32(*single_in);
    float32x2_t single_d = vdup_n_f32(*(single_in + 1));

    /* 64-bit form accumulates into single_d, 128-bit form into single_q. */
    float32x2_t fmlal_res = vfmlal_low_f16(single_d, half_d, half_d);
    float32x4_t fmlsl_res = vfmlslq_high_f16(single_q, half_q, half_q);

    int low_part = (int)vget_lane_f32(fmlal_res, 0);
    int high_part = (int)vgetq_lane_f32(fmlsl_res, 0);

    return low_part + high_part;
}
|