1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * rectangle filling function
3cabdff1aSopenharmony_ci * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
4cabdff1aSopenharmony_ci *
5cabdff1aSopenharmony_ci * This file is part of FFmpeg.
6cabdff1aSopenharmony_ci *
7cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
8cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
9cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
10cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
11cabdff1aSopenharmony_ci *
12cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
13cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
14cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15cabdff1aSopenharmony_ci * Lesser General Public License for more details.
16cabdff1aSopenharmony_ci *
17cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
18cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
19cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20cabdff1aSopenharmony_ci */
21cabdff1aSopenharmony_ci
22cabdff1aSopenharmony_ci/**
23cabdff1aSopenharmony_ci * @file
24cabdff1aSopenharmony_ci * useful rectangle filling function
25cabdff1aSopenharmony_ci * @author Michael Niedermayer <michaelni@gmx.at>
26cabdff1aSopenharmony_ci */
27cabdff1aSopenharmony_ci
28cabdff1aSopenharmony_ci#ifndef AVCODEC_RECTANGLE_H
29cabdff1aSopenharmony_ci#define AVCODEC_RECTANGLE_H
30cabdff1aSopenharmony_ci
31cabdff1aSopenharmony_ci#include "config.h"
32cabdff1aSopenharmony_ci#include "libavutil/common.h"
33cabdff1aSopenharmony_ci#include "libavutil/avassert.h"
34cabdff1aSopenharmony_ci
35cabdff1aSopenharmony_ci/**
36cabdff1aSopenharmony_ci * fill a rectangle.
37cabdff1aSopenharmony_ci * @param h height of the rectangle, should be a constant
38cabdff1aSopenharmony_ci * @param w width of the rectangle, should be a constant
39cabdff1aSopenharmony_ci * @param size the size of val (1, 2 or 4), should be a constant
40cabdff1aSopenharmony_ci */
41cabdff1aSopenharmony_cistatic av_always_inline void fill_rectangle(void *vp, int w, int h, int stride, uint32_t val, int size){
42cabdff1aSopenharmony_ci    uint8_t *p= (uint8_t*)vp;
43cabdff1aSopenharmony_ci    av_assert2(size==1 || size==2 || size==4);
44cabdff1aSopenharmony_ci    av_assert2(w<=4);
45cabdff1aSopenharmony_ci
46cabdff1aSopenharmony_ci    w      *= size;
47cabdff1aSopenharmony_ci    stride *= size;
48cabdff1aSopenharmony_ci
49cabdff1aSopenharmony_ci    av_assert2((((long)vp)&(FFMIN(w, 8<<(HAVE_NEON|ARCH_PPC|HAVE_MMX))-1)) == 0);
50cabdff1aSopenharmony_ci    av_assert2((stride&(w-1))==0);
51cabdff1aSopenharmony_ci    if(w==2){
52cabdff1aSopenharmony_ci        const uint16_t v= size==4 ? val : val*0x0101;
53cabdff1aSopenharmony_ci        *(uint16_t*)(p + 0*stride)= v;
54cabdff1aSopenharmony_ci        if(h==1) return;
55cabdff1aSopenharmony_ci        *(uint16_t*)(p + 1*stride)= v;
56cabdff1aSopenharmony_ci        if(h==2) return;
57cabdff1aSopenharmony_ci        *(uint16_t*)(p + 2*stride)= v;
58cabdff1aSopenharmony_ci        *(uint16_t*)(p + 3*stride)= v;
59cabdff1aSopenharmony_ci    }else if(w==4){
60cabdff1aSopenharmony_ci        const uint32_t v= size==4 ? val : size==2 ? val*0x00010001 : val*0x01010101;
61cabdff1aSopenharmony_ci        *(uint32_t*)(p + 0*stride)= v;
62cabdff1aSopenharmony_ci        if(h==1) return;
63cabdff1aSopenharmony_ci        *(uint32_t*)(p + 1*stride)= v;
64cabdff1aSopenharmony_ci        if(h==2) return;
65cabdff1aSopenharmony_ci        *(uint32_t*)(p + 2*stride)= v;
66cabdff1aSopenharmony_ci        *(uint32_t*)(p + 3*stride)= v;
67cabdff1aSopenharmony_ci    }else if(w==8){
68cabdff1aSopenharmony_ci    // gcc cannot optimize 64-bit math on x86_32
69cabdff1aSopenharmony_ci#if HAVE_FAST_64BIT
70cabdff1aSopenharmony_ci        const uint64_t v=  size==2 ? val*0x0001000100010001ULL : val*0x0100000001ULL;
71cabdff1aSopenharmony_ci        *(uint64_t*)(p + 0*stride)= v;
72cabdff1aSopenharmony_ci        if(h==1) return;
73cabdff1aSopenharmony_ci        *(uint64_t*)(p + 1*stride)= v;
74cabdff1aSopenharmony_ci        if(h==2) return;
75cabdff1aSopenharmony_ci        *(uint64_t*)(p + 2*stride)= v;
76cabdff1aSopenharmony_ci        *(uint64_t*)(p + 3*stride)= v;
77cabdff1aSopenharmony_ci    }else if(w==16){
78cabdff1aSopenharmony_ci        const uint64_t v= val*0x0100000001ULL;
79cabdff1aSopenharmony_ci        *(uint64_t*)(p + 0+0*stride)= v;
80cabdff1aSopenharmony_ci        *(uint64_t*)(p + 8+0*stride)= v;
81cabdff1aSopenharmony_ci        *(uint64_t*)(p + 0+1*stride)= v;
82cabdff1aSopenharmony_ci        *(uint64_t*)(p + 8+1*stride)= v;
83cabdff1aSopenharmony_ci        if(h==2) return;
84cabdff1aSopenharmony_ci        *(uint64_t*)(p + 0+2*stride)= v;
85cabdff1aSopenharmony_ci        *(uint64_t*)(p + 8+2*stride)= v;
86cabdff1aSopenharmony_ci        *(uint64_t*)(p + 0+3*stride)= v;
87cabdff1aSopenharmony_ci        *(uint64_t*)(p + 8+3*stride)= v;
88cabdff1aSopenharmony_ci#else
89cabdff1aSopenharmony_ci        const uint32_t v= size==2 ? val*0x00010001 : val;
90cabdff1aSopenharmony_ci        *(uint32_t*)(p + 0+0*stride)= v;
91cabdff1aSopenharmony_ci        *(uint32_t*)(p + 4+0*stride)= v;
92cabdff1aSopenharmony_ci        if(h==1) return;
93cabdff1aSopenharmony_ci        *(uint32_t*)(p + 0+1*stride)= v;
94cabdff1aSopenharmony_ci        *(uint32_t*)(p + 4+1*stride)= v;
95cabdff1aSopenharmony_ci        if(h==2) return;
96cabdff1aSopenharmony_ci        *(uint32_t*)(p + 0+2*stride)= v;
97cabdff1aSopenharmony_ci        *(uint32_t*)(p + 4+2*stride)= v;
98cabdff1aSopenharmony_ci        *(uint32_t*)(p + 0+3*stride)= v;
99cabdff1aSopenharmony_ci        *(uint32_t*)(p + 4+3*stride)= v;
100cabdff1aSopenharmony_ci    }else if(w==16){
101cabdff1aSopenharmony_ci        *(uint32_t*)(p + 0+0*stride)= val;
102cabdff1aSopenharmony_ci        *(uint32_t*)(p + 4+0*stride)= val;
103cabdff1aSopenharmony_ci        *(uint32_t*)(p + 8+0*stride)= val;
104cabdff1aSopenharmony_ci        *(uint32_t*)(p +12+0*stride)= val;
105cabdff1aSopenharmony_ci        *(uint32_t*)(p + 0+1*stride)= val;
106cabdff1aSopenharmony_ci        *(uint32_t*)(p + 4+1*stride)= val;
107cabdff1aSopenharmony_ci        *(uint32_t*)(p + 8+1*stride)= val;
108cabdff1aSopenharmony_ci        *(uint32_t*)(p +12+1*stride)= val;
109cabdff1aSopenharmony_ci        if(h==2) return;
110cabdff1aSopenharmony_ci        *(uint32_t*)(p + 0+2*stride)= val;
111cabdff1aSopenharmony_ci        *(uint32_t*)(p + 4+2*stride)= val;
112cabdff1aSopenharmony_ci        *(uint32_t*)(p + 8+2*stride)= val;
113cabdff1aSopenharmony_ci        *(uint32_t*)(p +12+2*stride)= val;
114cabdff1aSopenharmony_ci        *(uint32_t*)(p + 0+3*stride)= val;
115cabdff1aSopenharmony_ci        *(uint32_t*)(p + 4+3*stride)= val;
116cabdff1aSopenharmony_ci        *(uint32_t*)(p + 8+3*stride)= val;
117cabdff1aSopenharmony_ci        *(uint32_t*)(p +12+3*stride)= val;
118cabdff1aSopenharmony_ci#endif
119cabdff1aSopenharmony_ci    }else
120cabdff1aSopenharmony_ci        av_assert2(0);
121cabdff1aSopenharmony_ci    av_assert2(h==4);
122cabdff1aSopenharmony_ci}
123cabdff1aSopenharmony_ci
124cabdff1aSopenharmony_ci#endif /* AVCODEC_RECTANGLE_H */
125