/third_party/skia/src/opts/ |
H A D | SkBitmapProcState_opts.h | 53 const uint32_t* row0 = s.fPixmap.addr32(0,y0); in S32_alpha_D32_filter_DX() local 82 skvx::Vec<8,uint32_t> tl = gather(row0, x0), tr = gather(row0, x1), in S32_alpha_D32_filter_DX() 240 auto row0 = (const uint32_t*)((const uint8_t*)s.fPixmap.addr() + y0 * s.fPixmap.rowBytes()), in S32_alpha_D32_filter_DX() local 268 __m128i AB = interpolate_in_x_and_y(row0[x0[A]], row0[x1[A]], in S32_alpha_D32_filter_DX() 270 row0[x0[B]], row0[x1[B]], in S32_alpha_D32_filter_DX() 275 __m128i CD = interpolate_in_x_and_y(row0[x0[C]], row0[x in S32_alpha_D32_filter_DX() 323 auto row0 = (const uint32_t*)( (const char*)s.fPixmap.addr() + y0 * s.fPixmap.rowBytes() ), S32_alpha_D32_filter_DX() local 485 auto row0 = (const uint32_t*)( (const char*)s.fPixmap.addr() + y0 * s.fPixmap.rowBytes() ), S32_alpha_D32_filter_DX() local 520 auto row0 = (const uint32_t*)(src + y0*rb), S32_alpha_D32_filter_DXDY() local [all...] |
/third_party/skia/third_party/externals/libjpeg-turbo/simd/arm/ |
H A D | jquanti-neon.c | 57 int16x8_t row0 = in jsimd_convsamp_neon() local 74 vst1q_s16(workspace + 0 * DCTSIZE, row0); in jsimd_convsamp_neon() 105 int16x8_t row0 = vld1q_s16(workspace + (i + 0) * DCTSIZE); in jsimd_quantize_neon() local 124 int16x8_t sign_row0 = vshrq_n_s16(row0, 15); in jsimd_quantize_neon() 129 uint16x8_t abs_row0 = vreinterpretq_u16_s16(vabsq_s16(row0)); in jsimd_quantize_neon() 157 row0 = vcombine_s16(vshrn_n_s32(row0_l, 16), vshrn_n_s32(row0_h, 16)); in jsimd_quantize_neon() 165 row0 = vreinterpretq_s16_u16(vshlq_u16(vreinterpretq_u16_s16(row0), in jsimd_quantize_neon() 175 row0 = veorq_s16(row0, sign_row in jsimd_quantize_neon() [all...] |
H A D | jidctred-neon.c | 82 int16x8_t row0 = vld1q_s16(coef_block + 0 * DCTSIZE); in jsimd_idct_2x2_neon() local 96 row0 = vmulq_s16(row0, quant_row0); in jsimd_idct_2x2_neon() 105 /* Pass 1: process columns from input, put results in vectors row0 and in jsimd_idct_2x2_neon() 110 int32x4_t tmp10_l = vshll_n_s16(vget_low_s16(row0), CONST_BITS + 2); in jsimd_idct_2x2_neon() 111 int32x4_t tmp10_h = vshll_n_s16(vget_high_s16(row0), CONST_BITS + 2); in jsimd_idct_2x2_neon() 124 row0 = vcombine_s16(vrshrn_n_s32(vaddq_s32(tmp10_l, tmp0_l), CONST_BITS), in jsimd_idct_2x2_neon() 130 int16x8x2_t cols_0246_1357 = vtrnq_s16(row0, row1); in jsimd_idct_2x2_neon() 202 int16x8_t row0 = vld1q_s16(coef_block + 0 * DCTSIZE); in jsimd_idct_4x4_neon() local 213 row0 in jsimd_idct_4x4_neon() [all...] |
H A D | jidctint-neon.c | 97 static INLINE void jsimd_idct_islow_pass1_regular(int16x4_t row0, 116 static INLINE void jsimd_idct_islow_pass1_sparse(int16x4_t row0, 201 int16x4_t row0 = vld1_s16(coef_block + 0 * DCTSIZE); in jsimd_idct_islow_neon() local 233 int16x4_t dcval = vshl_n_s16(vmul_s16(row0, quant_row0), PASS1_BITS); in jsimd_idct_islow_neon() 239 jsimd_idct_islow_pass1_sparse(row0, row1, row2, row3, quant_row0, in jsimd_idct_islow_neon() 244 jsimd_idct_islow_pass1_regular(row0, row1, row2, row3, row4, row5, in jsimd_idct_islow_neon() 254 row0 = vld1_s16(coef_block + 0 * DCTSIZE + 4); in jsimd_idct_islow_neon() 287 bitmap = vorr_s16(bitmap, row0); in jsimd_idct_islow_neon() 291 int16x4_t dcval = vshl_n_s16(vmul_s16(row0, quant_row0), PASS1_BITS); in jsimd_idct_islow_neon() 299 jsimd_idct_islow_pass1_sparse(row0, row in jsimd_idct_islow_neon() 338 jsimd_idct_islow_pass1_regular(int16x4_t row0, int16x4_t row1, int16x4_t row2, int16x4_t row3, int16x4_t row4, int16x4_t row5, int16x4_t row6, int16x4_t row7, int16x4_t quant_row0, int16x4_t quant_row1, int16x4_t quant_row2, int16x4_t quant_row3, int16x4_t quant_row4, int16x4_t quant_row5, int16x4_t quant_row6, int16x4_t quant_row7, int16_t *workspace_1, int16_t *workspace_2) jsimd_idct_islow_pass1_regular() argument 473 jsimd_idct_islow_pass1_sparse(int16x4_t row0, int16x4_t row1, int16x4_t row2, int16x4_t row3, int16x4_t quant_row0, int16x4_t quant_row1, int16x4_t quant_row2, int16x4_t quant_row3, int16_t *workspace_1, int16_t *workspace_2) jsimd_idct_islow_pass1_sparse() argument [all...] |
H A D | jidctfst-neon.c | 69 int16x8_t row0 = vld1q_s16(coef_block + 0 * DCTSIZE); in jsimd_idct_ifast_neon() local 81 row0 = vmulq_s16(row0, quant_row0); in jsimd_idct_ifast_neon() 101 int16x8_t dcval = row0; in jsimd_idct_ifast_neon() 113 int16x4_t dcval = vget_low_s16(row0); in jsimd_idct_ifast_neon() 127 int16x4_t tmp0 = vget_high_s16(row0); in jsimd_idct_ifast_neon() 176 row0 = vcombine_s16(dcval, vadd_s16(tmp0, tmp7)); in jsimd_idct_ifast_neon() 188 int16x4_t dcval = vget_high_s16(row0); in jsimd_idct_ifast_neon() 202 int16x4_t tmp0 = vget_low_s16(row0); in jsimd_idct_ifast_neon() 251 row0 in jsimd_idct_ifast_neon() [all...] |
H A D | jfdctfst-neon.c | 152 int16x8_t row0 = vreinterpretq_s16_s32(rows_04.val[0]); in jsimd_fdct_ifast_neon() local 163 tmp0 = vaddq_s16(row0, row7); in jsimd_fdct_ifast_neon() 164 tmp7 = vsubq_s16(row0, row7); in jsimd_fdct_ifast_neon() 178 row0 = vaddq_s16(tmp10, tmp11); /* phase 3 */ in jsimd_fdct_ifast_neon() 206 vst1q_s16(data + 0 * DCTSIZE, row0); in jsimd_fdct_ifast_neon()
|
H A D | jfdctint-neon.c | 251 int16x8_t row0 = vreinterpretq_s16_s32(rows_04.val[0]); in jsimd_fdct_islow_neon() local 262 tmp0 = vaddq_s16(row0, row7); in jsimd_fdct_islow_neon() 263 tmp7 = vsubq_s16(row0, row7); in jsimd_fdct_islow_neon() 277 row0 = vrshrq_n_s16(vaddq_s16(tmp10, tmp11), PASS1_BITS); in jsimd_fdct_islow_neon() 368 vst1q_s16(data + 0 * DCTSIZE, row0); in jsimd_fdct_islow_neon()
|
/third_party/skia/third_party/externals/libjpeg-turbo/simd/arm/aarch32/ |
H A D | jchuff-neon.c | 52 int16x8_t row0 = vdupq_n_s16(block[0] - last_dc_val); in jsimd_huff_encode_one_block_neon() local 53 row0 = vld1q_lane_s16(block + 1, row0, 1); in jsimd_huff_encode_one_block_neon() 54 row0 = vld1q_lane_s16(block + 8, row0, 2); in jsimd_huff_encode_one_block_neon() 55 row0 = vld1q_lane_s16(block + 16, row0, 3); in jsimd_huff_encode_one_block_neon() 56 row0 = vld1q_lane_s16(block + 9, row0, 4); in jsimd_huff_encode_one_block_neon() 57 row0 in jsimd_huff_encode_one_block_neon() [all...] |
/third_party/skia/third_party/externals/swiftshader/src/Pipeline/ |
H A D | ShaderCore.cpp | 472 void transpose4x4(Short4 &row0, Short4 &row1, Short4 &row2, Short4 &row3) in transpose4x4() argument 474 Int2 tmp0 = UnpackHigh(row0, row1); in transpose4x4() 476 Int2 tmp2 = UnpackLow(row0, row1); in transpose4x4() 479 row0 = UnpackLow(tmp2, tmp3); in transpose4x4() 485 void transpose4x3(Short4 &row0, Short4 &row1, Short4 &row2, Short4 &row3) in transpose4x3() argument 487 Int2 tmp0 = UnpackHigh(row0, row1); in transpose4x3() 489 Int2 tmp2 = UnpackLow(row0, row1); in transpose4x3() 492 row0 = UnpackLow(tmp2, tmp3); in transpose4x3() 497 void transpose4x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) in transpose4x4() argument 499 Float4 tmp0 = UnpackLow(row0, row in transpose4x4() 510 transpose4x3(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) transpose4x3() argument 522 transpose4x2(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) transpose4x2() argument 531 transpose4x1(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) transpose4x1() argument 539 transpose2x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) transpose2x4() argument 550 transpose4xN(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3, int N) transpose4xN() argument [all...] |
H A D | ShaderCore.hpp | 214 void transpose4x4(Short4 &row0, Short4 &row1, Short4 &row2, Short4 &row3); 215 void transpose4x3(Short4 &row0, Short4 &row1, Short4 &row2, Short4 &row3); 216 void transpose4x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 217 void transpose4x3(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 218 void transpose4x2(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 219 void transpose4x1(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 220 void transpose2x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 221 void transpose4xN(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3, int N);
|
/third_party/skia/docs/examples/ |
H A D | Bitmap_getAddr.cpp | 7 char* row0 = (char* ) source.getAddr(0, 0); in REG_FIDDLE() local 10 (size_t) (row1 - row0) == source.rowBytes() ? '=' : '!'); in REG_FIDDLE()
|
H A D | Bitmap_getAddr32.cpp | 7 uint32_t* row0 = source.getAddr32(0, 0); in REG_FIDDLE() local 9 size_t interval = (row1 - row0) * source.bytesPerPixel(); in REG_FIDDLE()
|
H A D | Bitmap_getAddr16.cpp | 12 uint16_t* row0 = bitmap16.getAddr16(0, 0); in REG_FIDDLE() local 14 size_t interval = (row1 - row0) * bitmap16.bytesPerPixel(); in REG_FIDDLE()
|
/third_party/ffmpeg/libavcodec/mips/ |
H A D | vp8_lpf_msa.c | 380 v16u8 row0, row1, row2, row3, row4, row5, row6, row7, row8; in ff_vp8_h_loop_filter16_msa() local 388 LD_UB8(temp_src, pitch, row0, row1, row2, row3, row4, row5, row6, row7); in ff_vp8_h_loop_filter16_msa() 392 TRANSPOSE16x8_UB_UB(row0, row1, row2, row3, row4, row5, row6, row7, in ff_vp8_h_loop_filter16_msa() 445 v16u8 row0, row1, row2, row3, row4, row5, row6, row7, row8; in ff_vp8_h_loop_filter8uv_msa() local 453 LD_UB8(src_u - 4, pitch, row0, row1, row2, row3, row4, row5, row6, row7); in ff_vp8_h_loop_filter8uv_msa() 456 TRANSPOSE16x8_UB_UB(row0, row1, row2, row3, row4, row5, row6, row7, in ff_vp8_h_loop_filter8uv_msa() 525 v16u8 row0, row1, row2, row3, row4, row5, row6, row7, row8; in ff_vp8_h_loop_filter_simple_msa() local 531 LD_UB8(temp_src, pitch, row0, row1, row2, row3, row4, row5, row6, row7); in ff_vp8_h_loop_filter_simple_msa() 535 TRANSPOSE16x4_UB_UB(row0, row1, row2, row3, row4, row5, row6, row7, in ff_vp8_h_loop_filter_simple_msa() 595 v16u8 row0, row in ff_vp8_h_loop_filter8uv_inner_msa() local 649 v16u8 row0, row1, row2, row3, row4, row5, row6, row7; ff_vp8_h_loop_filter16_inner_msa() local [all...] |
/third_party/skia/third_party/externals/swiftshader/src/Shader/ |
H A D | ShaderCore.hpp | 87 void transpose4x4(Short4 &row0, Short4 &row1, Short4 &row2, Short4 &row3); 88 void transpose4x3(Short4 &row0, Short4 &row1, Short4 &row2, Short4 &row3); 89 void transpose4x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 90 void transpose4x3(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 91 void transpose4x2(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 92 void transpose4x1(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 93 void transpose2x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3); 94 void transpose4xN(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3, int N);
|
H A D | ShaderCore.cpp | 488 void transpose4x4(Short4 &row0, Short4 &row1, Short4 &row2, Short4 &row3) in transpose4x4() argument 490 Int2 tmp0 = UnpackHigh(row0, row1); in transpose4x4() 492 Int2 tmp2 = UnpackLow(row0, row1); in transpose4x4() 495 row0 = UnpackLow(tmp2, tmp3); in transpose4x4() 501 void transpose4x3(Short4 &row0, Short4 &row1, Short4 &row2, Short4 &row3) in transpose4x3() argument 503 Int2 tmp0 = UnpackHigh(row0, row1); in transpose4x3() 505 Int2 tmp2 = UnpackLow(row0, row1); in transpose4x3() 508 row0 = UnpackLow(tmp2, tmp3); in transpose4x3() 513 void transpose4x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) in transpose4x4() argument 515 Float4 tmp0 = UnpackLow(row0, row in transpose4x4() 526 transpose4x3(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) transpose4x3() argument 538 transpose4x2(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) transpose4x2() argument 547 transpose4x1(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) transpose4x1() argument 555 transpose2x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3) transpose2x4() argument 566 transpose4xN(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3, int N) transpose4xN() argument [all...] |
H A D | VertexProgram.cpp | 1018 Vector4f row0 = fetchRegister(src1, 0); in M3X2() local 1021 dst.x = dot3(src0, row0); in M3X2() 1027 Vector4f row0 = fetchRegister(src1, 0); in M3X3() local 1031 dst.x = dot3(src0, row0); in M3X3() 1038 Vector4f row0 = fetchRegister(src1, 0); in M3X4() local 1043 dst.x = dot3(src0, row0); in M3X4() 1051 Vector4f row0 = fetchRegister(src1, 0); in M4X3() local 1055 dst.x = dot4(src0, row0); in M4X3() 1062 Vector4f row0 = fetchRegister(src1, 0); in M4X4() local 1067 dst.x = dot4(src0, row0); in M4X4() [all...] |
/third_party/skia/third_party/externals/libjpeg-turbo/simd/arm/aarch64/ |
H A D | jchuff-neon.c | 121 int16x8_t row0 = in jsimd_huff_encode_one_block_neon() local 139 row0 = vsetq_lane_s16(block[0] - last_dc_val, row0, 0); in jsimd_huff_encode_one_block_neon() 161 int16x8_t abs_row0 = vabsq_s16(row0); in jsimd_huff_encode_one_block_neon() 172 vreinterpretq_u16_s16(veorq_s16(abs_row0, vshrq_n_s16(row0, 15))); in jsimd_huff_encode_one_block_neon()
|
/third_party/ffmpeg/libavcodec/loongarch/ |
H A D | h264dsp_lasx.c | 96 __m256i row0, row1, row2, row3, row4, row5, row6, row7; in ff_h264_h_lpf_luma_8_lasx() local 100 src, img_width_3x, row0, row1, row2, row3); in ff_h264_h_lpf_luma_8_lasx() 114 LASX_TRANSPOSE16x8_B(row0, row1, row2, row3, row4, row5, row6, in ff_h264_h_lpf_luma_8_lasx() 201 __m256i row0, row1, row2, row3, row4, row5, row6, row7; in ff_h264_h_lpf_luma_8_lasx() local 209 row0, row2); in ff_h264_h_lpf_luma_8_lasx() 212 DUP2_ARG2(__lasx_xvilvl_b, row2, row0, row3, row1, row4, row6); in ff_h264_h_lpf_luma_8_lasx() 213 DUP2_ARG2(__lasx_xvilvh_b, row2, row0, row3, row1, row5, row7); in ff_h264_h_lpf_luma_8_lasx() 393 __m256i row0, row1, row2, row3, row4, row5, row6, row7; in ff_h264_h_lpf_chroma_8_lasx() local 396 src, img_width_3x, row0, row1, row2, row3); in ff_h264_h_lpf_chroma_8_lasx() 402 DUP4_ARG2(__lasx_xvilvl_b, row2, row0, row in ff_h264_h_lpf_chroma_8_lasx() 597 __m256i row0, row1, row2, row3, row4, row5, row6, row7; ff_h264_h_lpf_luma_intra_8_lasx() local 717 __m256i row0, row1, row2, row3, row4, row5, row6, row7; ff_h264_h_lpf_luma_intra_8_lasx() local 892 __m256i row0, row1, row2, row3, row4, row5, row6, row7; ff_h264_h_lpf_chroma_intra_8_lasx() local [all...] |
H A D | vp8_lpf_lsx.c | 335 __m128i row0, row1, row2, row3, row4, row5, row6, row7, row8; in ff_vp8_h_loop_filter16_lsx() local 349 temp_src + stride3, 0, row0, row1, row2, row3); in ff_vp8_h_loop_filter16_lsx() 360 LSX_TRANSPOSE16x8_B(row0, row1, row2, row3, row4, row5, row6, row7, row8, row9, row10, in ff_vp8_h_loop_filter16_lsx() 422 __m128i row0, row1, row2, row3, row4, row5, row6, row7, row8; in ff_vp8_h_loop_filter8uv_lsx() local 436 temp_src + stride3, 0, row0, row1, row2, row3); in ff_vp8_h_loop_filter8uv_lsx() 448 LSX_TRANSPOSE16x8_B(row0, row1, row2, row3, row4, row5, row6, row7, in ff_vp8_h_loop_filter8uv_lsx()
|
/third_party/skia/third_party/externals/libwebp/src/dsp/ |
H A D | dec_msa.c | 364 v16u8 row0, row1, row2, row3, row4, row5, row6, row7, row8; in HFilter16() local 371 LD_UB8(ptmp, stride, row0, row1, row2, row3, row4, row5, row6, row7); in HFilter16() 374 TRANSPOSE16x8_UB_UB(row0, row1, row2, row3, row4, row5, row6, row7, in HFilter16() 446 v16u8 row0, row1, row2, row3, row4, row5, row6, row7; in HFilterVertEdge16i() local 453 LD_UB8(src - 4, stride, row0, row1, row2, row3, row4, row5, row6, row7); in HFilterVertEdge16i() 456 TRANSPOSE16x8_UB_UB(row0, row1, row2, row3, row4, row5, row6, row7, in HFilterVertEdge16i() 530 v16u8 row0, row1, row2, row3, row4, row5, row6, row7, row8; in HFilter8() local 537 LD_UB8(ptmp_src_u, stride, row0, row1, row2, row3, row4, row5, row6, row7); in HFilter8() 540 TRANSPOSE16x8_UB_UB(row0, row1, row2, row3, row4, row5, row6, row7, in HFilter8() 595 v16u8 row0, row in HFilter8i() local 636 v16u8 p1, p0, q1, q0, mask, row0, row1, row2, row3, row4, row5, row6, row7; SimpleHFilter16() local [all...] |
/third_party/skia/src/core/ |
H A D | SkBitmapProcState.cpp | 495 const SkPMColor* row0 = s.fPixmap.addr32(0, iY0); in S32_D32_constX_shaderproc() local 500 filter_32_alpha(iSubY, *row0, *row1, &color, s.fAlphaScale); in S32_D32_constX_shaderproc() 503 color = SkAlphaMulQ(*row0, s.fAlphaScale); in S32_D32_constX_shaderproc() 505 color = *row0; in S32_D32_constX_shaderproc()
|
/third_party/backends/backend/genesys/ |
H A D | image_pipeline.cpp | 306 const auto* row0 = buffer_.get_row_ptr(0); in get_next_row_data() local 313 std::uint16_t ch0 = get_raw_channel_from_row(row0, x, 0, format); in get_next_row_data() 513 const auto* row0 = buffer_.get_row_ptr(channel_shifts_[0]); in get_next_row_data() local 518 std::uint16_t ch0 = get_raw_channel_from_row(row0, x, 0, format); in get_next_row_data()
|
/third_party/skia/third_party/externals/libjpeg-turbo/simd/i386/ |
H A D | jidctred-sse2.asm | 553 paddd xmm1, xmm7 ; xmm1=tmp0[row0 row1 row0 row1] 557 pslld xmm6, (CONST_BITS+2) ; xmm6=tmp10[row0 row1 **** ****] 562 paddd xmm6, xmm1 ; xmm6=data0[row0 row1 **** ****]=(C0 C1 ** **) 563 psubd xmm4, xmm1 ; xmm4=data1[row0 row1 **** ****]=(D0 D1 ** **)
|
/third_party/skia/third_party/externals/libjpeg-turbo/simd/x86_64/ |
H A D | jidctred-sse2.asm | 538 paddd xmm1, xmm7 ; xmm1=tmp0[row0 row1 row0 row1] 542 pslld xmm6, (CONST_BITS+2) ; xmm6=tmp10[row0 row1 **** ****] 547 paddd xmm6, xmm1 ; xmm6=data0[row0 row1 **** ****]=(C0 C1 ** **) 548 psubd xmm4, xmm1 ; xmm4=data1[row0 row1 **** ****]=(D0 D1 ** **)
|