cpu_asimdfhm.c 529 B

12345678910111213141516171819
  1. #ifdef _MSC_VER
  2. #include <Intrin.h>
  3. #endif
  4. #include <arm_neon.h>
  5. int main(int argc, char **argv)
  6. {
  7. float16_t *src = (float16_t*)argv[argc-1];
  8. float *src2 = (float*)argv[argc-2];
  9. float16x8_t vhp = vdupq_n_f16(src[0]);
  10. float16x4_t vlhp = vdup_n_f16(src[1]);
  11. float32x4_t vf = vdupq_n_f32(src2[0]);
  12. float32x2_t vlf = vdup_n_f32(src2[1]);
  13. int ret = (int)vget_lane_f32(vfmlal_low_f16(vlf, vlhp, vlhp), 0);
  14. ret += (int)vgetq_lane_f32(vfmlslq_high_f16(vf, vhp, vhp), 0);
  15. return ret;
  16. }