summaryrefslogtreecommitdiffstats
path: root/media/libstagefright/codecs/on2/h264dec/omxdl/reference/vc/m4p10/src/omxVCM4P10_PredictIntra_4x4.c
blob: 3fa8212778d5249f4d26a75cd407ee19cb1974a7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
/* ----------------------------------------------------------------
 *
 * 
 * File Name:  omxVCM4P10_PredictIntra_4x4.c
 * OpenMAX DL: v1.0.2
 * Revision:   9641
 * Date:       Thursday, February 7, 2008
 * 
 * (c) Copyright 2007-2008 ARM Limited. All Rights Reserved.
 * 
 * 
 *
 * H.264 4x4 intra prediction module
 * 
 */
 
#include "omxtypes.h"
#include "armOMX.h"
#include "omxVC.h"

#include "armCOMM.h"
#include "armVC.h"

/**
 * Function:  omxVCM4P10_PredictIntra_4x4   (6.3.3.1.1)
 *
 * Description:
 * Perform Intra_4x4 prediction for luma samples. If the upper-right block is 
 * not available, then duplication work should be handled inside the function. 
 * Users need not define them outside. 
 *
 * Input Arguments:
 *   
 *   pSrcLeft -  Pointer to the buffer of 4 left pixels: 
 *                  p[x, y] (x = -1, y = 0..3) 
 *   pSrcAbove - Pointer to the buffer of 8 above pixels: 
 *                  p[x,y] (x = 0..7, y =-1); 
 *               must be aligned on a 4-byte boundary. 
 *   pSrcAboveLeft - Pointer to the above left pixels: p[x,y] (x = -1, y = -1) 
 *   leftStep - Step of left pixel buffer; must be a multiple of 4. 
 *   dstStep - Step of the destination buffer; must be a multiple of 4. 
 *   predMode - Intra_4x4 prediction mode. 
 *   availability - Neighboring 4x4 block availability flag, refer to 
 *             "Neighboring Macroblock Availability" . 
 *
 * Output Arguments:
 *   
 *   pDst - Pointer to the destination buffer; must be aligned on a 4-byte 
 *            boundary. 
 *
 * Return Value:
 *    If the function runs without error, it returns OMX_Sts_NoErr. 
 *    If one of the following cases occurs, the function returns 
 *              OMX_Sts_BadArgErr: 
 *    pDst is NULL. 
 *    dstStep < 4, or dstStep is not a multiple of 4. 
 *    leftStep is not a multiple of 4. 
 *    predMode is not in the valid range of enumeration 
 *              OMXVCM4P10Intra4x4PredMode. 
 *    predMode is OMX_VC_4x4_VERT, but availability doesn't set OMX_VC_UPPER 
 *              indicating p[x,-1] (x = 0..3) is not available. 
 *    predMode is OMX_VC_4x4_HOR, but availability doesn't set OMX_VC_LEFT 
 *              indicating p[-1,y] (y = 0..3) is not available. 
 *    predMode is OMX_VC_4x4_DIAG_DL, but availability doesn't set 
 *              OMX_VC_UPPER indicating p[x,-1] (x = 0..3) is not available. 
 *    predMode is OMX_VC_4x4_DIAG_DR, but availability doesn't set 
 *              OMX_VC_UPPER_LEFT or OMX_VC_UPPER or OMX_VC_LEFT indicating 
 *              p[x,-1] (x = 0..3), or p[-1,y] (y = 0..3) or p[-1,-1] is not 
 *              available. 
 *    predMode is OMX_VC_4x4_VR, but availability doesn't set 
 *              OMX_VC_UPPER_LEFT or OMX_VC_UPPER or OMX_VC_LEFT indicating 
 *              p[x,-1] (x = 0..3), or p[-1,y] (y = 0..3) or p[-1,-1] is not 
 *              available. 
 *    predMode is OMX_VC_4x4_HD, but availability doesn't set 
 *              OMX_VC_UPPER_LEFT or OMX_VC_UPPER or OMX_VC_LEFT indicating 
 *              p[x,-1] (x = 0..3), or p[-1,y] (y = 0..3) or p[-1,-1] is not 
 *              available. 
 *    predMode is OMX_VC_4x4_VL, but availability doesn't set OMX_VC_UPPER 
 *              indicating p[x,-1] (x = 0..3) is not available. 
 *    predMode is OMX_VC_4x4_HU, but availability doesn't set OMX_VC_LEFT 
 *              indicating p[-1,y] (y = 0..3) is not available. 
 *    availability sets OMX_VC_UPPER, but pSrcAbove is NULL. 
 *    availability sets OMX_VC_LEFT, but pSrcLeft is NULL. 
 *    availability sets OMX_VC_UPPER_LEFT, but pSrcAboveLeft is NULL. 
 *    either pSrcAbove or pDst is not aligned on a 4-byte boundary.  
 *
 * Note: 
 *     pSrcLeft, pSrcAbove, pSrcAboveLeft may be invalid pointers if 
 *     they are not used by intra prediction as implied in predMode. 
 *
 */

OMXResult omxVCM4P10_PredictIntra_4x4(
     const OMX_U8* pSrcLeft,
     const OMX_U8 *pSrcAbove,
     const OMX_U8 *pSrcAboveLeft,
     OMX_U8* pDst,
     OMX_INT leftStep,
     OMX_INT dstStep,
     OMXVCM4P10Intra4x4PredMode predMode,
     OMX_S32 availability
 )
{
    int x, y;
    /* Scratch line of filtered neighbour samples. Each directional mode
     * fills only the entries it needs, then maps them onto the 4x4 block
     * with a mode-specific index expression in x and y.
     */
    OMX_U8 pTmp[10];

    /* Argument validation: pointer/step sanity first, then "a neighbour
     * flagged available must have a non-NULL pointer", then "the chosen
     * mode must have every neighbour it reads flagged available".
     */
    armRetArgErrIf(pDst == NULL, OMX_Sts_BadArgErr);
    armRetArgErrIf((leftStep % 4) != 0,  OMX_Sts_BadArgErr);
    armRetArgErrIf((dstStep % 4) != 0,  OMX_Sts_BadArgErr);
    armRetArgErrIf((dstStep < 4),  OMX_Sts_BadArgErr);
    armRetArgErrIf(armNot4ByteAligned(pSrcAbove), OMX_Sts_BadArgErr);
    armRetArgErrIf(armNot4ByteAligned(pDst), OMX_Sts_BadArgErr);
    armRetArgErrIf((availability & OMX_VC_UPPER)      && pSrcAbove     == NULL, OMX_Sts_BadArgErr);
    armRetArgErrIf((availability & OMX_VC_LEFT )      && pSrcLeft      == NULL, OMX_Sts_BadArgErr);
    armRetArgErrIf((availability & OMX_VC_UPPER_LEFT) && pSrcAboveLeft == NULL, OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_VERT    && !(availability & OMX_VC_UPPER),      OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_HOR     && !(availability & OMX_VC_LEFT),       OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_DIAG_DL && !(availability & OMX_VC_UPPER),      OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_DIAG_DR && !(availability & OMX_VC_UPPER),      OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_DIAG_DR && !(availability & OMX_VC_UPPER_LEFT), OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_DIAG_DR && !(availability & OMX_VC_LEFT),       OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_VR      && !(availability & OMX_VC_UPPER),      OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_VR      && !(availability & OMX_VC_UPPER_LEFT), OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_VR      && !(availability & OMX_VC_LEFT),       OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_HD      && !(availability & OMX_VC_UPPER),      OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_HD      && !(availability & OMX_VC_UPPER_LEFT), OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_HD      && !(availability & OMX_VC_LEFT),       OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_VL      && !(availability & OMX_VC_UPPER),      OMX_Sts_BadArgErr);
    armRetArgErrIf(predMode==OMX_VC_4X4_HU      && !(availability & OMX_VC_LEFT),       OMX_Sts_BadArgErr);
    armRetArgErrIf((unsigned)predMode > OMX_VC_4X4_HU,   OMX_Sts_BadArgErr);

    /* Note: This code must not read the pSrc arrays unless the corresponding
     * block is marked as available. If the block is not available then pSrc
     * may not be a valid pointer.
     *
     * Note: To make the code more readable we refer to the neighbouring pixels
     * in variables named as below:
     *
     *    UL U0 U1 U2 U3 U4 U5 U6 U7
     *    L0 xx xx xx xx
     *    L1 xx xx xx xx
     *    L2 xx xx xx xx
     *    L3 xx xx xx xx
     *
     * These are macros rather than locals so that a neighbour is only
     * dereferenced in the modes that actually use it. They are #undef'd
     * at the end of the function so the short names do not leak into the
     * rest of the translation unit.
     */

#define UL pSrcAboveLeft[0]
#define U0 pSrcAbove[0]
#define U1 pSrcAbove[1]
#define U2 pSrcAbove[2]
#define U3 pSrcAbove[3]
#define U4 pSrcAbove[4]
#define U5 pSrcAbove[5]
#define U6 pSrcAbove[6]
#define U7 pSrcAbove[7]
#define L0 pSrcLeft[0*leftStep]
#define L1 pSrcLeft[1*leftStep]
#define L2 pSrcLeft[2*leftStep]
#define L3 pSrcLeft[3*leftStep]

    switch (predMode)
    {
    case OMX_VC_4X4_VERT:
        /* Every row is a copy of the four samples directly above. */
        for (y=0; y<4; y++)
        {
            pDst[y*dstStep+0] = U0;
            pDst[y*dstStep+1] = U1;
            pDst[y*dstStep+2] = U2;
            pDst[y*dstStep+3] = U3;
        }
        break;

    case OMX_VC_4X4_HOR:
        /* Every column is a copy of the four samples directly left. */
        for (x=0; x<4; x++)
        {
            pDst[0*dstStep+x] = L0;
            pDst[1*dstStep+x] = L1;
            pDst[2*dstStep+x] = L2;
            pDst[3*dstStep+x] = L3;
        }
        break;

    case OMX_VC_4X4_DC:
        /* This can always be used even if no blocks available */
        armVCM4P10_PredictIntraDC4x4(pSrcLeft, pSrcAbove, pDst, leftStep, dstStep, availability);
        break;

    case OMX_VC_4X4_DIAG_DL:
        /* pTmp is indexed by x+y */
        pTmp[0] = (OMX_U8)((U0 + 2*U1 + U2 + 2)>>2);
        pTmp[1] = (OMX_U8)((U1 + 2*U2 + U3 + 2)>>2);
        if (availability & OMX_VC_UPPER_RIGHT)
        {
            pTmp[2] = (OMX_U8)((U2 + 2*U3 + U4 + 2)>>2);
            pTmp[3] = (OMX_U8)((U3 + 2*U4 + U5 + 2)>>2);
            pTmp[4] = (OMX_U8)((U4 + 2*U5 + U6 + 2)>>2);
            pTmp[5] = (OMX_U8)((U5 + 2*U6 + U7 + 2)>>2);
            pTmp[6] = (OMX_U8)((U6 + 3*U7      + 2)>>2);
        }
        else
        {
            /* Upper-right not available: U4..U7 are never read and U3
             * stands in for them, so the 3-tap filter collapses to
             * (U2 + 3*U3) and then to plain U3.
             */
            pTmp[2] = (OMX_U8)((U2 + 3*U3      + 2)>>2);
            pTmp[3] = U3;
            pTmp[4] = U3;
            pTmp[5] = U3;
            pTmp[6] = U3;
        }
        for (y=0; y<4; y++)
        {
            for (x=0; x<4; x++)
            {
                pDst[y*dstStep+x] = pTmp[x+y];
            }
        }
        break;

    case OMX_VC_4X4_DIAG_DR:
        /* x-y = -3, -2, -1, 0, 1, 2, 3  (pTmp is indexed by 3+x-y) */
        pTmp[0] = (OMX_U8)((L1 + 2*L2 + L3 + 2)>>2);
        pTmp[1] = (OMX_U8)((L0 + 2*L1 + L2 + 2)>>2);
        pTmp[2] = (OMX_U8)((UL + 2*L0 + L1 + 2)>>2);
        pTmp[3] = (OMX_U8)((U0 + 2*UL + L0 + 2)>>2);
        pTmp[4] = (OMX_U8)((U1 + 2*U0 + UL + 2)>>2);
        pTmp[5] = (OMX_U8)((U2 + 2*U1 + U0 + 2)>>2);
        pTmp[6] = (OMX_U8)((U3 + 2*U2 + U1 + 2)>>2);
        for (y=0; y<4; y++)
        {
            for (x=0; x<4; x++)
            {
                pDst[y*dstStep+x] = pTmp[3+x-y];
            }
        }
        break;

    case OMX_VC_4X4_VR:
        /* zVR=2x-y = -3, -2, -1, 0, 1, 2, 3, 4, 5, 6
         * x-(y>>1) = -1, -1,  0, 0, 1, 1, 2, 2, 3, 3
         * y        =  3,  2,  ?, ?, ?, ?, ?, ?, 1, 0
         *
         * pTmp is indexed by 3+zVR.
         */
        pTmp[0] = (OMX_U8)((L2 + 2*L1 + L0 + 2)>>2);
        pTmp[1] = (OMX_U8)((L1 + 2*L0 + UL + 2)>>2);
        pTmp[2] = (OMX_U8)((L0 + 2*UL + U0 + 2)>>2);
        pTmp[3] = (OMX_U8)((UL + U0 + 1)>>1);
        pTmp[4] = (OMX_U8)((UL + 2*U0 + U1 + 2)>>2);
        pTmp[5] = (OMX_U8)((U0 + U1 + 1)>>1);
        pTmp[6] = (OMX_U8)((U0 + 2*U1 + U2 + 2)>>2);
        pTmp[7] = (OMX_U8)((U1 + U2 + 1)>>1);
        pTmp[8] = (OMX_U8)((U1 + 2*U2 + U3 + 2)>>2);
        pTmp[9] = (OMX_U8)((U2 + U3 + 1)>>1);
        for (y=0; y<4; y++)
        {
            for (x=0; x<4; x++)
            {
                pDst[y*dstStep+x] = pTmp[3+2*x-y];
            }
        }
        break;

    case OMX_VC_4X4_HD:
        /* zHD=2y-x = -3 -2 -1  0  1  2  3  4  5  6
         * y-(x>>1) = -1 -1  0  0  1  1  2  2  3  3
         * x        =  3  2                    1  0
         *
         * pTmp is indexed by 3+zHD.
         */
        pTmp[0] = (OMX_U8)((U2 + 2*U1 + U0 + 2)>>2);
        pTmp[1] = (OMX_U8)((U1 + 2*U0 + UL + 2)>>2);
        pTmp[2] = (OMX_U8)((U0 + 2*UL + L0 + 2)>>2);
        pTmp[3] = (OMX_U8)((UL + L0 + 1)>>1);
        pTmp[4] = (OMX_U8)((UL + 2*L0 + L1 + 2)>>2);
        pTmp[5] = (OMX_U8)((L0 + L1 + 1)>>1);
        pTmp[6] = (OMX_U8)((L0 + 2*L1 + L2 + 2)>>2);
        pTmp[7] = (OMX_U8)((L1 + L2 + 1)>>1);
        pTmp[8] = (OMX_U8)((L1 + 2*L2 + L3 + 2)>>2);
        pTmp[9] = (OMX_U8)((L2 + L3 + 1)>>1);
        for (y=0; y<4; y++)
        {
            for (x=0; x<4; x++)
            {
                pDst[y*dstStep+x] = pTmp[3+2*y-x];
            }
        }
        break;

    case OMX_VC_4X4_VL:
        /* Note: x+(y>>1) = (2*x+y)>>1
         * 2x+y = 0 1 2 3 4 5 6 7 8 9
         */
        pTmp[0] = (OMX_U8)((U0 + U1 + 1)>>1);
        pTmp[1] = (OMX_U8)((U0 + 2*U1 + U2 + 2)>>2);
        pTmp[2] = (OMX_U8)((U1 + U2 + 1)>>1);
        pTmp[3] = (OMX_U8)((U1 + 2*U2 + U3 + 2)>>2);
        pTmp[4] = (OMX_U8)((U2 + U3 + 1)>>1);
        if (availability & OMX_VC_UPPER_RIGHT)
        {
            pTmp[5] = (OMX_U8)((U2 + 2*U3 + U4 + 2)>>2);
            pTmp[6] = (OMX_U8)((U3 + U4 + 1)>>1);
            pTmp[7] = (OMX_U8)((U3 + 2*U4 + U5 + 2)>>2);
            pTmp[8] = (OMX_U8)((U4 + U5 + 1)>>1);
            pTmp[9] = (OMX_U8)((U4 + 2*U5 + U6 + 2)>>2);
        }
        else
        {
            /* Upper-right not available: U3 stands in for U4..U6. */
            pTmp[5] = (OMX_U8)((U2 + 3*U3 + 2)>>2);
            pTmp[6] = U3;
            pTmp[7] = U3;
            pTmp[8] = U3;
            pTmp[9] = U3;
        }
        for (y=0; y<4; y++)
        {
            for (x=0; x<4; x++)
            {
                pDst[y*dstStep+x] = pTmp[2*x+y];
            }
        }
        break;

    case OMX_VC_4X4_HU:
        /* zHU = x+2*y */
        pTmp[0] = (OMX_U8)((L0 + L1 + 1)>>1);
        pTmp[1] = (OMX_U8)((L0 + 2*L1 + L2 + 2)>>2);
        pTmp[2] = (OMX_U8)((L1 + L2 + 1)>>1);
        pTmp[3] = (OMX_U8)((L1 + 2*L2 + L3 + 2)>>2);
        pTmp[4] = (OMX_U8)((L2 + L3 + 1)>>1);
        pTmp[5] = (OMX_U8)((L2 + 3*L3 + 2)>>2);
        pTmp[6] = L3;
        pTmp[7] = L3;
        pTmp[8] = L3;
        pTmp[9] = L3;
        for (y=0; y<4; y++)
        {
            for (x=0; x<4; x++)
            {
                pDst[y*dstStep+x] = pTmp[x+2*y];
            }
        }
        break;

    default:
        /* Any other value is rejected by the predMode range check above
         * before the switch is reached; nothing is written to pDst here.
         */
        break;
    }

    /* Drop the function-local neighbour aliases. */
#undef UL
#undef U0
#undef U1
#undef U2
#undef U3
#undef U4
#undef U5
#undef U6
#undef U7
#undef L0
#undef L1
#undef L2
#undef L3

    return OMX_Sts_NoErr;
}