43 const unsigned lt = src[-1-1*
stride];
49 (
t2 + 2*
t3 +
t4 + 2) >> 2);
58 const unsigned lt = src[-1-1*
stride];
61 AV_WN32A(src+0*stride, ((lt + 2*l0 + l1 + 2) >> 2)*0x01010101);
62 AV_WN32A(src+1*stride, ((l0 + 2*l1 + l2 + 2) >> 2)*0x01010101);
63 AV_WN32A(src+2*stride, ((l1 + 2*l2 + l3 + 2) >> 2)*0x01010101);
64 AV_WN32A(src+3*stride, ((l2 + 2*l3 + l3 + 2) >> 2)*0x01010101);
95 src[0+0*
stride]=(
t0 +
t2 + 2*
t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
97 src[0+1*
stride]=(
t1 +
t3 + 2*
t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
100 src[0+2*
stride]=(
t2 +
t4 + 2*
t3 + 2 + l2 + l4 + 2*l3 + 2)>>3;
104 src[0+3*
stride]=(
t3 +
t5 + 2*
t4 + 2 + l3 + l5 + 2*l4 + 2)>>3;
107 src[1+3*
stride]=(
t4 +
t6 + 2*
t5 + 2 + l4 + l6 + 2*l5 + 2)>>3;
109 src[2+3*
stride]=(
t5 +
t7 + 2*
t6 + 2 + l5 + l7 + 2*l6 + 2)>>3;
110 src[3+3*
stride]=(
t6 +
t7 + 1 + l6 + l7 + 1)>>2;
118 src[0+0*
stride]=(
t0 +
t2 + 2*
t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
120 src[0+1*
stride]=(
t1 +
t3 + 2*
t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
123 src[0+2*
stride]=(
t2 +
t4 + 2*
t3 + 2 + l2 + 3*l3 + 2)>>3;
137 const int l0,
const int l1,
const int l2,
const int l3,
const int l4){
141 src[0+0*
stride]=(2*
t0 + 2*
t1 + l1 + 2*l2 + l3 + 4)>>3;
149 src[0+1*
stride]=(
t0 + 2*
t1 +
t2 + l2 + 2*l3 + l4 + 4)>>3;
201 src[1+0*
stride]=(
t2 + 2*
t3 +
t4 + l0 + 2*l1 + l2 + 4)>>3;
205 src[1+1*
stride]=(
t4 + 2*
t5 +
t6 + l1 + 2*l2 + l3 + 4)>>3;
209 src[1+2*
stride]=(
t6 + 3*
t7 + l2 + 3*l3 + 4)>>3;
211 src[1+3*
stride]=(l3 + 2*l4 + l5 + 2)>>2;
214 src[2+3*
stride]=(l4 + l5 + 1)>>1;
215 src[3+3*
stride]=(l4 + 2*l5 + l6 + 2)>>2;
224 src[1+0*
stride]=(
t2 + 2*
t3 +
t4 + l0 + 2*l1 + l2 + 4)>>3;
228 src[1+1*
stride]=(
t4 + 2*
t5 +
t6 + l1 + 2*l2 + l3 + 4)>>3;
232 src[1+2*
stride]=(
t6 + 3*
t7 + l2 + 3*l3 + 4)>>3;
243 uint8_t *top = src-
stride;
246 for (y = 0; y < 4; y++) {
247 uint8_t *cm_in = cm + src[-1];
248 src[0] = cm_in[top[0]];
249 src[1] = cm_in[top[1]];
250 src[2] = cm_in[top[2]];
251 src[3] = cm_in[top[3]];
257 pred16x16_plane_compat_8_c(src, stride, 1, 0);
261 pred16x16_plane_compat_8_c(src, stride, 0, 1);
266 uint8_t *top = src-
stride;
269 for (y = 0; y < 16; y++) {
270 uint8_t *cm_in = cm + src[-1];
271 src[0] = cm_in[top[0]];
272 src[1] = cm_in[top[1]];
273 src[2] = cm_in[top[2]];
274 src[3] = cm_in[top[3]];
275 src[4] = cm_in[top[4]];
276 src[5] = cm_in[top[5]];
277 src[6] = cm_in[top[6]];
278 src[7] = cm_in[top[7]];
279 src[8] = cm_in[top[8]];
280 src[9] = cm_in[top[9]];
281 src[10] = cm_in[top[10]];
282 src[11] = cm_in[top[11]];
283 src[12] = cm_in[top[12]];
284 src[13] = cm_in[top[13]];
285 src[14] = cm_in[top[14]];
286 src[15] = cm_in[top[15]];
297 dc0+= src[-1+i*stride];
298 dc0= 0x01010101*((dc0 + 4)>>3);
301 ((uint32_t*)(src+i*stride))[0]=
302 ((uint32_t*)(src+i*
stride))[1]= dc0;
313 dc0= 0x01010101*((dc0 + 4)>>3);
316 ((uint32_t*)(src+i*stride))[0]=
317 ((uint32_t*)(src+i*
stride))[1]= dc0;
328 dc0+= src[-1+(i+4)*stride];
330 dc0= 0x01010101*((dc0 + 8)>>4);
333 ((uint32_t*)(src+i*stride))[0]= dc0;
334 ((uint32_t*)(src+i*stride))[1]= dc0;
337 ((uint32_t*)(src+i*stride))[0]= dc0;
338 ((uint32_t*)(src+i*stride))[1]= dc0;
344 uint8_t *top = src-
stride;
347 for (y = 0; y < 8; y++) {
348 uint8_t *cm_in = cm + src[-1];
349 src[0] = cm_in[top[0]];
350 src[1] = cm_in[top[1]];
351 src[2] = cm_in[top[2]];
352 src[3] = cm_in[top[3]];
353 src[4] = cm_in[top[4]];
354 src[5] = cm_in[top[5]];
355 src[6] = cm_in[top[6]];
356 src[7] = cm_in[top[7]];
/*
 * Identifier-building helpers used when assigning entries of the
 * prediction function tables. Each macro glues its arguments together
 * with the preprocessor ## operator:
 *
 *   FUNC(a, depth)   ->  a_<depth>      (e.g. the pred8x8_mad_cow_dc_* entries)
 *   FUNCC(a, depth)  ->  a_<depth>_c    (predictors named per bit depth)
 *   FUNCD(a)         ->  a_c            (no depth component in the name,
 *                                        e.g. the *_vp8 / *_rv40 / *_svq3 entries)
 */
369 #define FUNC(a, depth) a ## _ ## depth
370 #define FUNCC(a, depth) a ## _ ## depth ## _c
371 #define FUNCD(a) a ## _c
373 #define H264_PRED(depth) \
374 if(codec_id != CODEC_ID_RV40){\
375 if(codec_id == CODEC_ID_VP8) {\
376 h->pred4x4[VERT_PRED ]= FUNCD(pred4x4_vertical_vp8);\
377 h->pred4x4[HOR_PRED ]= FUNCD(pred4x4_horizontal_vp8);\
379 h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
380 h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
382 h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
383 if(codec_id == CODEC_ID_SVQ3)\
384 h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_svq3);\
386 h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred4x4_down_left , depth);\
387 h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
388 h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
389 h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
390 if (codec_id == CODEC_ID_VP8) {\
391 h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_vp8);\
393 h->pred4x4[VERT_LEFT_PRED ]= FUNCC(pred4x4_vertical_left , depth);\
394 h->pred4x4[HOR_UP_PRED ]= FUNCC(pred4x4_horizontal_up , depth);\
395 if(codec_id != CODEC_ID_VP8) {\
396 h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
397 h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
398 h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
400 h->pred4x4[TM_VP8_PRED ]= FUNCD(pred4x4_tm_vp8);\
401 h->pred4x4[DC_127_PRED ]= FUNCC(pred4x4_127_dc , depth);\
402 h->pred4x4[DC_129_PRED ]= FUNCC(pred4x4_129_dc , depth);\
403 h->pred4x4[VERT_VP8_PRED ]= FUNCC(pred4x4_vertical , depth);\
404 h->pred4x4[HOR_VP8_PRED ]= FUNCC(pred4x4_horizontal , depth);\
407 h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
408 h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
409 h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
410 h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_rv40);\
411 h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
412 h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
413 h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
414 h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_rv40);\
415 h->pred4x4[HOR_UP_PRED ]= FUNCD(pred4x4_horizontal_up_rv40);\
416 h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
417 h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
418 h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
419 h->pred4x4[DIAG_DOWN_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_down_left_rv40_nodown);\
420 h->pred4x4[HOR_UP_PRED_RV40_NODOWN]= FUNCD(pred4x4_horizontal_up_rv40_nodown);\
421 h->pred4x4[VERT_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_vertical_left_rv40_nodown);\
424 h->pred8x8l[VERT_PRED ]= FUNCC(pred8x8l_vertical , depth);\
425 h->pred8x8l[HOR_PRED ]= FUNCC(pred8x8l_horizontal , depth);\
426 h->pred8x8l[DC_PRED ]= FUNCC(pred8x8l_dc , depth);\
427 h->pred8x8l[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred8x8l_down_left , depth);\
428 h->pred8x8l[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred8x8l_down_right , depth);\
429 h->pred8x8l[VERT_RIGHT_PRED ]= FUNCC(pred8x8l_vertical_right , depth);\
430 h->pred8x8l[HOR_DOWN_PRED ]= FUNCC(pred8x8l_horizontal_down , depth);\
431 h->pred8x8l[VERT_LEFT_PRED ]= FUNCC(pred8x8l_vertical_left , depth);\
432 h->pred8x8l[HOR_UP_PRED ]= FUNCC(pred8x8l_horizontal_up , depth);\
433 h->pred8x8l[LEFT_DC_PRED ]= FUNCC(pred8x8l_left_dc , depth);\
434 h->pred8x8l[TOP_DC_PRED ]= FUNCC(pred8x8l_top_dc , depth);\
435 h->pred8x8l[DC_128_PRED ]= FUNCC(pred8x8l_128_dc , depth);\
437 if (chroma_format_idc <= 1) {\
438 h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x8_vertical , depth);\
439 h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x8_horizontal , depth);\
441 h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x16_vertical , depth);\
442 h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x16_horizontal , depth);\
444 if (codec_id != CODEC_ID_VP8) {\
445 if (chroma_format_idc <= 1) {\
446 h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x8_plane , depth);\
448 h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x16_plane , depth);\
451 h->pred8x8[PLANE_PRED8x8]= FUNCD(pred8x8_tm_vp8);\
452 if(codec_id != CODEC_ID_RV40 && codec_id != CODEC_ID_VP8){\
453 if (chroma_format_idc <= 1) {\
454 h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x8_dc , depth);\
455 h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x8_left_dc , depth);\
456 h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x8_top_dc , depth);\
457 h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l0t, depth);\
458 h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0lt, depth);\
459 h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l00, depth);\
460 h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0l0, depth);\
462 h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x16_dc , depth);\
463 h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x16_left_dc , depth);\
464 h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x16_top_dc , depth);\
465 h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l0t, depth);\
466 h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0lt, depth);\
467 h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l00, depth);\
468 h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0l0, depth);\
471 h->pred8x8[DC_PRED8x8 ]= FUNCD(pred8x8_dc_rv40);\
472 h->pred8x8[LEFT_DC_PRED8x8]= FUNCD(pred8x8_left_dc_rv40);\
473 h->pred8x8[TOP_DC_PRED8x8 ]= FUNCD(pred8x8_top_dc_rv40);\
474 if (codec_id == CODEC_ID_VP8) {\
475 h->pred8x8[DC_127_PRED8x8]= FUNCC(pred8x8_127_dc , depth);\
476 h->pred8x8[DC_129_PRED8x8]= FUNCC(pred8x8_129_dc , depth);\
479 if (chroma_format_idc <= 1) {\
480 h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x8_128_dc , depth);\
482 h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x16_128_dc , depth);\
485 h->pred16x16[DC_PRED8x8 ]= FUNCC(pred16x16_dc , depth);\
486 h->pred16x16[VERT_PRED8x8 ]= FUNCC(pred16x16_vertical , depth);\
487 h->pred16x16[HOR_PRED8x8 ]= FUNCC(pred16x16_horizontal , depth);\
490 h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_svq3);\
493 h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_rv40);\
496 h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_tm_vp8);\
497 h->pred16x16[DC_127_PRED8x8]= FUNCC(pred16x16_127_dc , depth);\
498 h->pred16x16[DC_129_PRED8x8]= FUNCC(pred16x16_129_dc , depth);\
501 h->pred16x16[PLANE_PRED8x8 ]= FUNCC(pred16x16_plane , depth);\
504 h->pred16x16[LEFT_DC_PRED8x8]= FUNCC(pred16x16_left_dc , depth);\
505 h->pred16x16[TOP_DC_PRED8x8 ]= FUNCC(pred16x16_top_dc , depth);\
506 h->pred16x16[DC_128_PRED8x8 ]= FUNCC(pred16x16_128_dc , depth);\
509 h->pred4x4_add [VERT_PRED ]= FUNCC(pred4x4_vertical_add , depth);\
510 h->pred4x4_add [ HOR_PRED ]= FUNCC(pred4x4_horizontal_add , depth);\
511 h->pred8x8l_add [VERT_PRED ]= FUNCC(pred8x8l_vertical_add , depth);\
512 h->pred8x8l_add [ HOR_PRED ]= FUNCC(pred8x8l_horizontal_add , depth);\
513 if (chroma_format_idc <= 1) {\
514 h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x8_vertical_add , depth);\
515 h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x8_horizontal_add , depth);\
517 h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x16_vertical_add , depth);\
518 h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x16_horizontal_add , depth);\
520 h->pred16x16_add[VERT_PRED8x8]= FUNCC(pred16x16_vertical_add , depth);\
521 h->pred16x16_add[ HOR_PRED8x8]= FUNCC(pred16x16_horizontal_add , depth);\