Lines Matching refs:val
145 posSamp.val[0] = vrev64q_s16(posSamp.val[0]); in ProcessNeonIntrinsic()
146 posSamp.val[1] = vrev64q_s16(posSamp.val[1]); in ProcessNeonIntrinsic()
149 accum = vmlal_s16(accum, vget_low_s16(posSamp.val[0]), vget_high_s16(posCoef)); // r in ProcessNeonIntrinsic()
150 accum = vmlal_s16(accum, vget_high_s16(posSamp.val[0]), vget_low_s16(posCoef)); // r in ProcessNeonIntrinsic()
151 accum2 = vmlal_s16(accum2, vget_low_s16(posSamp.val[1]), vget_high_s16(posCoef)); // r in ProcessNeonIntrinsic()
152 accum2 = vmlal_s16(accum2, vget_high_s16(posSamp.val[1]), vget_low_s16(posCoef)); // r in ProcessNeonIntrinsic()
153 accum = vmlal_s16(accum, vget_low_s16(negSamp.val[0]), vget_low_s16(negCoef)); in ProcessNeonIntrinsic()
154 accum = vmlal_s16(accum, vget_high_s16(negSamp.val[0]), vget_high_s16(negCoef)); in ProcessNeonIntrinsic()
155 accum2 = vmlal_s16(accum2, vget_low_s16(negSamp.val[1]), vget_low_s16(negCoef)); in ProcessNeonIntrinsic()
156 accum2 = vmlal_s16(accum2, vget_high_s16(negSamp.val[1]), vget_high_s16(negCoef)); in ProcessNeonIntrinsic()
222 posCoef.val[0] = vld1q_s32(coefsP); in ProcessNeonIntrinsic()
224 posCoef.val[1] = vld1q_s32(coefsP); in ProcessNeonIntrinsic()
227 negCoef.val[0] = vld1q_s32(coefsN); in ProcessNeonIntrinsic()
229 negCoef.val[1] = vld1q_s32(coefsN); in ProcessNeonIntrinsic()
240 posCoef1.val[0] = vld1q_s32(coefsP1); in ProcessNeonIntrinsic()
242 posCoef1.val[1] = vld1q_s32(coefsP1); in ProcessNeonIntrinsic()
245 negCoef1.val[0] = vld1q_s32(coefsN1); in ProcessNeonIntrinsic()
247 negCoef1.val[1] = vld1q_s32(coefsN1); in ProcessNeonIntrinsic()
251 posCoef1.val[0] = vsubq_s32(posCoef1.val[0], posCoef.val[0]); in ProcessNeonIntrinsic()
252 posCoef1.val[1] = vsubq_s32(posCoef1.val[1], posCoef.val[1]); in ProcessNeonIntrinsic()
253 negCoef.val[0] = vsubq_s32(negCoef.val[0], negCoef1.val[0]); in ProcessNeonIntrinsic()
254 negCoef.val[1] = vsubq_s32(negCoef.val[1], negCoef1.val[1]); in ProcessNeonIntrinsic()
256 posCoef1.val[0] = vqrdmulhq_lane_s32(posCoef1.val[0], interp, 0); in ProcessNeonIntrinsic()
257 posCoef1.val[1] = vqrdmulhq_lane_s32(posCoef1.val[1], interp, 0); in ProcessNeonIntrinsic()
258 negCoef.val[0] = vqrdmulhq_lane_s32(negCoef.val[0], interp, 0); in ProcessNeonIntrinsic()
259 negCoef.val[1] = vqrdmulhq_lane_s32(negCoef.val[1], interp, 0); in ProcessNeonIntrinsic()
261 posCoef.val[0] = vaddq_s32(posCoef.val[0], posCoef1.val[0]); in ProcessNeonIntrinsic()
262 posCoef.val[1] = vaddq_s32(posCoef.val[1], posCoef1.val[1]); in ProcessNeonIntrinsic()
263 negCoef.val[0] = vaddq_s32(negCoef.val[0], negCoef1.val[0]); in ProcessNeonIntrinsic()
264 negCoef.val[1] = vaddq_s32(negCoef.val[1], negCoef1.val[1]); in ProcessNeonIntrinsic()
279 posSamp0 = vqrdmulhq_s32(posSamp0, posCoef.val[1]); // reversed in ProcessNeonIntrinsic()
280 posSamp1 = vqrdmulhq_s32(posSamp1, posCoef.val[0]); // reversed in ProcessNeonIntrinsic()
281 negSamp0 = vqrdmulhq_s32(negSamp0, negCoef.val[0]); in ProcessNeonIntrinsic()
282 negSamp1 = vqrdmulhq_s32(negSamp1, negCoef.val[1]); in ProcessNeonIntrinsic()
295 posSamp.val[0] = vrev64q_s16(posSamp.val[0]); in ProcessNeonIntrinsic()
296 posSamp.val[1] = vrev64q_s16(posSamp.val[1]); in ProcessNeonIntrinsic()
299 int32x4_t posSamp0 = vshll_n_s16(vget_low_s16(posSamp.val[0]), 15); in ProcessNeonIntrinsic()
300 int32x4_t posSamp1 = vshll_n_s16(vget_high_s16(posSamp.val[0]), 15); in ProcessNeonIntrinsic()
301 int32x4_t negSamp0 = vshll_n_s16(vget_low_s16(negSamp.val[0]), 15); in ProcessNeonIntrinsic()
302 int32x4_t negSamp1 = vshll_n_s16(vget_high_s16(negSamp.val[0]), 15); in ProcessNeonIntrinsic()
305 posSamp0 = vqrdmulhq_s32(posSamp0, posCoef.val[1]); // reversed in ProcessNeonIntrinsic()
306 posSamp1 = vqrdmulhq_s32(posSamp1, posCoef.val[0]); // reversed in ProcessNeonIntrinsic()
307 negSamp0 = vqrdmulhq_s32(negSamp0, negCoef.val[0]); in ProcessNeonIntrinsic()
308 negSamp1 = vqrdmulhq_s32(negSamp1, negCoef.val[1]); in ProcessNeonIntrinsic()
316 posSamp0 = vshll_n_s16(vget_low_s16(posSamp.val[1]), 15); in ProcessNeonIntrinsic()
317 posSamp1 = vshll_n_s16(vget_high_s16(posSamp.val[1]), 15); in ProcessNeonIntrinsic()
318 negSamp0 = vshll_n_s16(vget_low_s16(negSamp.val[1]), 15); in ProcessNeonIntrinsic()
319 negSamp1 = vshll_n_s16(vget_high_s16(negSamp.val[1]), 15); in ProcessNeonIntrinsic()
322 posSamp0 = vqrdmulhq_s32(posSamp0, posCoef.val[1]); // reversed in ProcessNeonIntrinsic()
323 posSamp1 = vqrdmulhq_s32(posSamp1, posCoef.val[0]); // reversed in ProcessNeonIntrinsic()
324 negSamp0 = vqrdmulhq_s32(negSamp0, negCoef.val[0]); in ProcessNeonIntrinsic()
325 negSamp1 = vqrdmulhq_s32(negSamp1, negCoef.val[1]); in ProcessNeonIntrinsic()
397 posCoef.val[0] = vld1q_f32(coefsP); in ProcessNeonIntrinsic()
399 posCoef.val[1] = vld1q_f32(coefsP); in ProcessNeonIntrinsic()
402 negCoef.val[0] = vld1q_f32(coefsN); in ProcessNeonIntrinsic()
404 negCoef.val[1] = vld1q_f32(coefsN); in ProcessNeonIntrinsic()
415 posCoef1.val[0] = vld1q_f32(coefsP1); in ProcessNeonIntrinsic()
417 posCoef1.val[1] = vld1q_f32(coefsP1); in ProcessNeonIntrinsic()
420 negCoef1.val[0] = vld1q_f32(coefsN1); in ProcessNeonIntrinsic()
422 negCoef1.val[1] = vld1q_f32(coefsN1); in ProcessNeonIntrinsic()
425 posCoef1.val[0] = vsubq_f32(posCoef1.val[0], posCoef.val[0]); in ProcessNeonIntrinsic()
426 posCoef1.val[1] = vsubq_f32(posCoef1.val[1], posCoef.val[1]); in ProcessNeonIntrinsic()
427 negCoef.val[0] = vsubq_f32(negCoef.val[0], negCoef1.val[0]); in ProcessNeonIntrinsic()
428 negCoef.val[1] = vsubq_f32(negCoef.val[1], negCoef1.val[1]); in ProcessNeonIntrinsic()
430 posCoef.val[0] = vmlaq_lane_f32(posCoef.val[0], posCoef1.val[0], interp, 0); in ProcessNeonIntrinsic()
431 posCoef.val[1] = vmlaq_lane_f32(posCoef.val[1], posCoef1.val[1], interp, 0); in ProcessNeonIntrinsic()
432 negCoef.val[0] = vmlaq_lane_f32(negCoef1.val[0], negCoef.val[0], interp, 0); // rev in ProcessNeonIntrinsic()
433 negCoef.val[1] = vmlaq_lane_f32(negCoef1.val[1], negCoef.val[1], interp, 0); // rev in ProcessNeonIntrinsic()
444 posSamp.val[0] = vld1q_f32(sP); in ProcessNeonIntrinsic()
446 posSamp.val[1] = vld1q_f32(sP); in ProcessNeonIntrinsic()
449 negSamp.val[0] = vld1q_f32(sN); in ProcessNeonIntrinsic()
451 negSamp.val[1] = vld1q_f32(sN); in ProcessNeonIntrinsic()
455 posSamp.val[0] = vrev64q_f32(posSamp.val[0]); in ProcessNeonIntrinsic()
456 posSamp.val[1] = vrev64q_f32(posSamp.val[1]); in ProcessNeonIntrinsic()
457 posSamp.val[0] = vcombine_f32( in ProcessNeonIntrinsic()
458 vget_high_f32(posSamp.val[0]), vget_low_f32(posSamp.val[0])); in ProcessNeonIntrinsic()
459 posSamp.val[1] = vcombine_f32( in ProcessNeonIntrinsic()
460 vget_high_f32(posSamp.val[1]), vget_low_f32(posSamp.val[1])); in ProcessNeonIntrinsic()
462 accum = vmlaq_f32(accum, posSamp.val[0], posCoef.val[1]); in ProcessNeonIntrinsic()
463 accum = vmlaq_f32(accum, posSamp.val[1], posCoef.val[0]); in ProcessNeonIntrinsic()
464 accum = vmlaq_f32(accum, negSamp.val[0], negCoef.val[0]); in ProcessNeonIntrinsic()
465 accum = vmlaq_f32(accum, negSamp.val[1], negCoef.val[1]); in ProcessNeonIntrinsic()
472 posSamp0.val[0] = vrev64q_f32(posSamp0.val[0]); in ProcessNeonIntrinsic()
473 posSamp0.val[1] = vrev64q_f32(posSamp0.val[1]); in ProcessNeonIntrinsic()
474 posSamp0.val[0] = vcombine_f32( in ProcessNeonIntrinsic()
475 vget_high_f32(posSamp0.val[0]), vget_low_f32(posSamp0.val[0])); in ProcessNeonIntrinsic()
476 posSamp0.val[1] = vcombine_f32( in ProcessNeonIntrinsic()
477 vget_high_f32(posSamp0.val[1]), vget_low_f32(posSamp0.val[1])); in ProcessNeonIntrinsic()
483 posSamp1.val[0] = vrev64q_f32(posSamp1.val[0]); in ProcessNeonIntrinsic()
484 posSamp1.val[1] = vrev64q_f32(posSamp1.val[1]); in ProcessNeonIntrinsic()
485 posSamp1.val[0] = vcombine_f32( in ProcessNeonIntrinsic()
486 vget_high_f32(posSamp1.val[0]), vget_low_f32(posSamp1.val[0])); in ProcessNeonIntrinsic()
487 posSamp1.val[1] = vcombine_f32( in ProcessNeonIntrinsic()
488 vget_high_f32(posSamp1.val[1]), vget_low_f32(posSamp1.val[1])); in ProcessNeonIntrinsic()
494 accum = vmlaq_f32(accum, negSamp0.val[0], negCoef.val[0]); in ProcessNeonIntrinsic()
495 accum = vmlaq_f32(accum, negSamp1.val[0], negCoef.val[1]); in ProcessNeonIntrinsic()
496 accum2 = vmlaq_f32(accum2, negSamp0.val[1], negCoef.val[0]); in ProcessNeonIntrinsic()
497 accum2 = vmlaq_f32(accum2, negSamp1.val[1], negCoef.val[1]); in ProcessNeonIntrinsic()
499 accum = vmlaq_f32(accum, posSamp0.val[0], posCoef.val[1]); // reversed in ProcessNeonIntrinsic()
500 accum = vmlaq_f32(accum, posSamp1.val[0], posCoef.val[0]); // reversed in ProcessNeonIntrinsic()
501 accum2 = vmlaq_f32(accum2, posSamp0.val[1], posCoef.val[1]); // reversed in ProcessNeonIntrinsic()
502 accum2 = vmlaq_f32(accum2, posSamp1.val[1], posCoef.val[0]); // reversed in ProcessNeonIntrinsic()