Lines Matching refs:v5
63 ld1 {v5.8H}, [x16], #16 // load 8x16-bit filter values, part 1
67 smlal v0.4S, v4.4H, v5.4H // v0 accumulates srcp[filterPos[0] + {0..3}] * filter[{0..3}]
68 smlal2 v0.4S, v4.8H, v5.8H // v0 accumulates srcp[filterPos[0] + {4..7}] * filter[{4..7}]
106 // v5 madd accumulator 4S
150 movi v5.2D, #0 // Clear madd accumulator for idx 4..7
175 smlal2 v5.4S, v1.8H, v16.8H // multiply accumulate inner loop j = 0, idx = 4..7
176 smlal2 v5.4S, v2.8H, v17.8H // multiply accumulate inner loop j = 1, idx = 4..7
179 smlal2 v5.4S, v3.8H, v18.8H // multiply accumulate inner loop j = 2, idx = 4..7
180 smlal2 v5.4S, v4.8H, v19.8H // multiply accumulate inner loop j = 3, idx = 4..7
186 sqshrn v1.4H, v5.4S, #7 // shift and clip the 2x16-bit final values
196 movi v5.2D, #0 // Clear madd accumulator for idx 4..7
208 smlal2 v5.4S, v1.8H, v16.8H // multiply accumulate inner loop j = 0, idx = 4..7
209 smlal2 v5.4S, v2.8H, v17.8H // multiply accumulate inner loop j = 1, idx = 4..7
210 smlal2 v5.4S, v3.8H, v18.8H // multiply accumulate inner loop j = 2, idx = 4..7
211 smlal2 v5.4S, v4.8H, v19.8H // multiply accumulate inner loop j = 3, idx = 4..7
215 sqshrn v1.4H, v5.4S, #7 // shift and clip the 2x16-bit final values
228 ld1 {v5.S}[0], [x9] // src[filterPos[i] + 0..3]
232 uxtl v5.8H, v5.8B // unsigned extend long, convert src data to 16-bit
233 smull v0.4S, v5.4H, v6.4H // 4 iterations of src[...] * filter[...]